//
// Generated by NVIDIA NVVM Compiler
//
// Compiler Build ID: CL-31968024
// Cuda compilation tools, release 12.0, V12.0.76
// Based on NVVM 7.0.1
//

// Module header directives.
//   .version      - PTX ISA version this module is written against (8.0).
//   .target       - architecture the module is compiled for (sm_52).
//   .address_size - addresses are 64 bits wide; the entry point below holds
//                   its addresses in 64-bit %rd registers accordingly.
.version 8.0
.target sm_52
.address_size 64

	// .globl	__raygen__oxMain
// params: 384-byte, 16-byte-aligned block in the constant state space.
// __raygen__oxMain reads it with ld.const at fixed byte offsets; the offsets
// visible in this file include +64, +136..+208, +272..+320, +340, +352 and +372.
// NOTE(review): presumably the OptiX launch-parameter struct filled in by the
// host; the field layout comes from the original source and is not visible
// here -- confirm against the host-side struct before touching any offset.
.const .align 16 .b8 params[384];
// __cudart_i2opi_f: 24 bytes = six little-endian 32-bit words, least significant
// word first. The last word is 0xA2F9836E, the leading fractional bits of 2/pi.
// The entry point's slow argument-reduction paths (taken when |x| is not below
// 0f47CE4780) load all six words with ld.global.nc.u32, multiply each by the
// input's left-shifted mantissa with a carry chain, and store the partial
// products to the local scratch buffer __local_depot0.
// NOTE(review): this looks like the table behind the sinf/cosf large-argument
// reduction -- the initializer bytes must stay exactly as emitted.
.global .align 4 .b8 __cudart_i2opi_f[24] = {65, 144, 67, 60, 153, 149, 98, 219, 192, 221, 52, 245, 209, 87, 39, 252, 41, 21, 68, 78, 110, 131, 249, 162};

.visible .entry __raygen__oxMain()
{
	.local .align 4 .b8 	__local_depot0[28];
	.reg .b64 	%SP;
	.reg .b64 	%SPL;
	.reg .pred 	%p<177>;
	.reg .b16 	%rs<17>;
	.reg .f32 	%f<1447>;
	.reg .b32 	%r<766>;
	.reg .f64 	%fd<13>;
	.reg .b64 	%rd<179>;


	mov.u64 	%SPL, __local_depot0;
	add.u64 	%rd1, %SPL, 0;
	// begin inline asm
	call (%r155), _optix_get_launch_index_x, ();
	// end inline asm
	// begin inline asm
	call (%r156), _optix_get_launch_index_y, ();
	// end inline asm
	// begin inline asm
	call (%r158), _optix_get_launch_dimension_x, ();
	// end inline asm
	// begin inline asm
	call (%r159), _optix_get_launch_dimension_y, ();
	// end inline asm
	ld.const.v4.u32 	{%r161, %r162, %r163, %r164}, [params+352];
	add.s32 	%r169, %r161, %r155;
	and.b32  	%r170, %r169, 255;
	add.s32 	%r171, %r162, %r156;
	and.b32  	%r172, %r171, 255;
	add.s32 	%r173, %r163, %r155;
	and.b32  	%r174, %r173, 255;
	add.s32 	%r175, %r164, %r156;
	and.b32  	%r176, %r175, 255;
	ld.const.u64 	%rd47, [params+192];
	cvta.to.global.u64 	%rd48, %rd47;
	ld.const.u32 	%r177, [params+184];
	mad.lo.s32 	%r178, %r177, %r172, %r170;
	mul.wide.u32 	%rd49, %r178, 3;
	add.s64 	%rd50, %rd48, %rd49;
	ld.global.u8 	%rs3, [%rd50];
	cvt.rn.f32.u16 	%f359, %rs3;
	div.rn.f32 	%f1, %f359, 0f437F0000;
	ld.global.u8 	%rs4, [%rd50+1];
	cvt.rn.f32.u16 	%f360, %rs4;
	div.rn.f32 	%f2, %f360, 0f437F0000;
	ld.global.u8 	%rs5, [%rd50+2];
	cvt.rn.f32.u16 	%f361, %rs5;
	div.rn.f32 	%f3, %f361, 0f437F0000;
	mad.lo.s32 	%r179, %r177, %r176, %r174;
	mul.wide.u32 	%rd51, %r179, 3;
	add.s64 	%rd2, %rd48, %rd51;
	ld.const.u32 	%r5, [params+340];
	setp.eq.s32 	%p5, %r5, 0;
	@%p5 bra 	$L__BB0_26;

	ld.global.u8 	%rs6, [%rd2];
	cvt.rn.f32.u16 	%f362, %rs6;
	div.rn.f32 	%f363, %f362, 0f437F0000;
	ld.global.u8 	%rs7, [%rd2+1];
	cvt.rn.f32.u16 	%f364, %rs7;
	div.rn.f32 	%f365, %f364, 0f437F0000;
	ld.const.u64 	%rd52, [params+144];
	cvta.to.global.u64 	%rd53, %rd52;
	ld.const.u32 	%r180, [params+136];
	mad.lo.s32 	%r181, %r180, %r156, %r155;
	mul.wide.u32 	%rd54, %r181, 12;
	add.s64 	%rd55, %rd53, %rd54;
	ld.global.f32 	%f1360, [%rd55];
	ld.global.f32 	%f1361, [%rd55+4];
	ld.global.f32 	%f1362, [%rd55+8];
	ld.const.u64 	%rd56, [params+160];
	cvta.to.global.u64 	%rd57, %rd56;
	ld.const.u32 	%r182, [params+152];
	mad.lo.s32 	%r183, %r182, %r156, %r155;
	mul.wide.u32 	%rd58, %r183, 12;
	add.s64 	%rd59, %rd57, %rd58;
	ld.global.f32 	%f7, [%rd59];
	abs.f32 	%f366, %f7;
	ld.global.f32 	%f8, [%rd59+8];
	abs.f32 	%f367, %f8;
	setp.gt.f32 	%p6, %f366, %f367;
	ld.global.f32 	%f9, [%rd59+4];
	neg.f32 	%f368, %f9;
	neg.f32 	%f369, %f8;
	selp.f32 	%f370, %f368, 0f00000000, %p6;
	selp.f32 	%f371, %f7, %f369, %p6;
	selp.f32 	%f372, 0f00000000, %f9, %p6;
	mul.f32 	%f373, %f371, %f371;
	fma.rn.f32 	%f374, %f370, %f370, %f373;
	fma.rn.f32 	%f375, %f372, %f372, %f374;
	sqrt.rn.f32 	%f376, %f375;
	rcp.rn.f32 	%f377, %f376;
	mul.f32 	%f10, %f370, %f377;
	mul.f32 	%f11, %f371, %f377;
	mul.f32 	%f12, %f372, %f377;
	sqrt.rn.f32 	%f13, %f363;
	mul.f32 	%f14, %f365, 0f40C90FDB;
	mul.f32 	%f378, %f14, 0f3F22F983;
	cvt.rni.s32.f32 	%r749, %f378;
	cvt.rn.f32.s32 	%f379, %r749;
	mov.f32 	%f380, 0fBFC90FDA;
	fma.rn.f32 	%f381, %f379, %f380, %f14;
	mov.f32 	%f382, 0fB3A22168;
	fma.rn.f32 	%f383, %f379, %f382, %f381;
	mov.f32 	%f384, 0fA7C234C5;
	fma.rn.f32 	%f1354, %f379, %f384, %f383;
	abs.f32 	%f16, %f14;
	setp.ltu.f32 	%p7, %f16, 0f47CE4780;
	mov.u32 	%r745, %r749;
	mov.f32 	%f1351, %f1354;
	@%p7 bra 	$L__BB0_9;

	setp.eq.f32 	%p8, %f16, 0f7F800000;
	@%p8 bra 	$L__BB0_8;
	bra.uni 	$L__BB0_3;

$L__BB0_8:
	mov.f32 	%f387, 0f00000000;
	mul.rn.f32 	%f1351, %f14, %f387;
	mov.u32 	%r745, 0;
	bra.uni 	$L__BB0_9;

$L__BB0_26:
	ld.const.v4.f32 	{%f437, %f1360, %f1361, %f1362}, [params+304];
	cvt.rn.f32.u32 	%f442, %r159;
	cvt.rn.f32.u32 	%f443, %r158;
	div.rn.f32 	%f444, %f443, %f442;
	cvt.rn.f32.u32 	%f445, %r155;
	add.f32 	%f446, %f1, %f445;
	div.rn.f32 	%f447, %f446, %f443;
	cvt.rn.f32.u32 	%f448, %r156;
	add.f32 	%f449, %f2, %f448;
	div.rn.f32 	%f450, %f449, %f442;
	fma.rn.f32 	%f451, %f447, 0f40000000, 0fBF800000;
	fma.rn.f32 	%f452, %f450, 0f40000000, 0fBF800000;
	ld.const.f32 	%f453, [params+320];
	mul.f32 	%f454, %f444, %f453;
	ld.const.v4.f32 	{%f455, %f456, %f457, %f458}, [params+272];
	mul.f32 	%f463, %f451, %f455;
	mul.f32 	%f464, %f451, %f456;
	mul.f32 	%f465, %f451, %f457;
	ld.const.v4.f32 	{%f466, %f467, %f468, %f469}, [params+288];
	fma.rn.f32 	%f474, %f454, %f463, %f468;
	fma.rn.f32 	%f475, %f454, %f464, %f469;
	fma.rn.f32 	%f476, %f454, %f465, %f437;
	mul.f32 	%f477, %f452, %f458;
	mul.f32 	%f478, %f452, %f466;
	mul.f32 	%f479, %f452, %f467;
	fma.rn.f32 	%f480, %f453, %f477, %f474;
	fma.rn.f32 	%f481, %f453, %f478, %f475;
	fma.rn.f32 	%f482, %f453, %f479, %f476;
	mul.f32 	%f483, %f481, %f481;
	fma.rn.f32 	%f484, %f480, %f480, %f483;
	fma.rn.f32 	%f485, %f482, %f482, %f484;
	sqrt.rn.f32 	%f486, %f485;
	rcp.rn.f32 	%f487, %f486;
	mul.f32 	%f1357, %f480, %f487;
	mul.f32 	%f1358, %f481, %f487;
	mul.f32 	%f1359, %f487, %f482;
	bra.uni 	$L__BB0_27;

$L__BB0_3:
	mov.b32 	%r7, %f14;
	bfe.u32 	%r185, %r7, 23, 8;
	add.s32 	%r8, %r185, -128;
	shl.b32 	%r186, %r7, 8;
	or.b32  	%r9, %r186, -2147483648;
	shr.u32 	%r10, %r8, 5;
	mov.u64 	%rd163, 0;
	mov.u32 	%r742, 0;
	mov.u64 	%rd162, __cudart_i2opi_f;
	mov.u64 	%rd161, %rd1;

$L__BB0_4:
	.pragma "nounroll";
	ld.global.nc.u32 	%r187, [%rd162];
	mad.wide.u32 	%rd62, %r187, %r9, %rd163;
	shr.u64 	%rd163, %rd62, 32;
	st.local.u32 	[%rd161], %rd62;
	add.s64 	%rd162, %rd162, 4;
	add.s64 	%rd161, %rd161, 4;
	add.s32 	%r742, %r742, 1;
	setp.ne.s32 	%p9, %r742, 6;
	@%p9 bra 	$L__BB0_4;

	st.local.u32 	[%rd1+24], %rd163;
	mov.u32 	%r188, 4;
	sub.s32 	%r13, %r188, %r10;
	mov.u32 	%r189, 6;
	sub.s32 	%r190, %r189, %r10;
	mul.wide.s32 	%rd63, %r190, 4;
	add.s64 	%rd64, %rd1, %rd63;
	ld.local.u32 	%r743, [%rd64];
	ld.local.u32 	%r744, [%rd64+-4];
	and.b32  	%r16, %r8, 31;
	setp.eq.s32 	%p10, %r16, 0;
	@%p10 bra 	$L__BB0_7;

	mov.u32 	%r191, 32;
	sub.s32 	%r192, %r191, %r16;
	shr.u32 	%r193, %r744, %r192;
	shl.b32 	%r194, %r743, %r16;
	add.s32 	%r743, %r193, %r194;
	mul.wide.s32 	%rd65, %r13, 4;
	add.s64 	%rd66, %rd1, %rd65;
	ld.local.u32 	%r195, [%rd66];
	shr.u32 	%r196, %r195, %r192;
	shl.b32 	%r197, %r744, %r16;
	add.s32 	%r744, %r196, %r197;

$L__BB0_7:
	and.b32  	%r198, %r7, -2147483648;
	shr.u32 	%r199, %r744, 30;
	shl.b32 	%r200, %r743, 2;
	or.b32  	%r201, %r199, %r200;
	shr.u32 	%r202, %r201, 31;
	shr.u32 	%r203, %r743, 30;
	add.s32 	%r204, %r202, %r203;
	neg.s32 	%r205, %r204;
	setp.eq.s32 	%p11, %r198, 0;
	selp.b32 	%r745, %r204, %r205, %p11;
	setp.ne.s32 	%p12, %r202, 0;
	xor.b32  	%r206, %r198, -2147483648;
	selp.b32 	%r207, %r206, %r198, %p12;
	selp.b32 	%r208, -1, 0, %p12;
	xor.b32  	%r209, %r201, %r208;
	shl.b32 	%r210, %r744, 2;
	xor.b32  	%r211, %r210, %r208;
	cvt.u64.u32 	%rd67, %r209;
	cvt.u64.u32 	%rd68, %r211;
	bfi.b64 	%rd69, %rd67, %rd68, 32, 32;
	cvt.rn.f64.s64 	%fd1, %rd69;
	mul.f64 	%fd2, %fd1, 0d3BF921FB54442D19;
	cvt.rn.f32.f64 	%f385, %fd2;
	setp.eq.s32 	%p13, %r207, 0;
	neg.f32 	%f386, %f385;
	selp.f32 	%f1351, %f385, %f386, %p13;

$L__BB0_9:
	add.s32 	%r23, %r745, 1;
	and.b32  	%r24, %r23, 1;
	setp.eq.s32 	%p14, %r24, 0;
	selp.f32 	%f20, %f1351, 0f3F800000, %p14;
	mul.rn.f32 	%f21, %f1351, %f1351;
	mov.f32 	%f1352, 0fB94D4153;
	@%p14 bra 	$L__BB0_11;

	mov.f32 	%f389, 0fBAB607ED;
	mov.f32 	%f390, 0f37CBAC00;
	fma.rn.f32 	%f1352, %f390, %f21, %f389;

$L__BB0_11:
	selp.f32 	%f391, 0f3C0885E4, 0f3D2AAABB, %p14;
	fma.rn.f32 	%f392, %f1352, %f21, %f391;
	selp.f32 	%f393, 0fBE2AAAA8, 0fBEFFFFFF, %p14;
	fma.rn.f32 	%f394, %f392, %f21, %f393;
	mov.f32 	%f395, 0f00000000;
	fma.rn.f32 	%f396, %f21, %f20, %f395;
	fma.rn.f32 	%f1353, %f394, %f396, %f20;
	and.b32  	%r213, %r23, 2;
	setp.eq.s32 	%p16, %r213, 0;
	@%p16 bra 	$L__BB0_13;

	mov.f32 	%f398, 0fBF800000;
	fma.rn.f32 	%f1353, %f1353, %f398, %f395;

$L__BB0_13:
	@%p7 bra 	$L__BB0_21;

	setp.eq.f32 	%p18, %f16, 0f7F800000;
	@%p18 bra 	$L__BB0_20;
	bra.uni 	$L__BB0_15;

$L__BB0_20:
	mov.f32 	%f401, 0f00000000;
	mul.rn.f32 	%f1354, %f14, %f401;
	mov.u32 	%r749, 0;
	bra.uni 	$L__BB0_21;

$L__BB0_15:
	mov.b32 	%r25, %f14;
	bfe.u32 	%r215, %r25, 23, 8;
	add.s32 	%r26, %r215, -128;
	shl.b32 	%r216, %r25, 8;
	or.b32  	%r27, %r216, -2147483648;
	shr.u32 	%r28, %r26, 5;
	mov.u64 	%rd166, 0;
	mov.u32 	%r746, 0;
	mov.u64 	%rd165, __cudart_i2opi_f;
	mov.u64 	%rd164, %rd1;

$L__BB0_16:
	.pragma "nounroll";
	ld.global.nc.u32 	%r217, [%rd165];
	mad.wide.u32 	%rd72, %r217, %r27, %rd166;
	shr.u64 	%rd166, %rd72, 32;
	st.local.u32 	[%rd164], %rd72;
	add.s64 	%rd165, %rd165, 4;
	add.s64 	%rd164, %rd164, 4;
	add.s32 	%r746, %r746, 1;
	setp.ne.s32 	%p19, %r746, 6;
	@%p19 bra 	$L__BB0_16;

	st.local.u32 	[%rd1+24], %rd166;
	mov.u32 	%r218, 4;
	sub.s32 	%r31, %r218, %r28;
	mov.u32 	%r219, 6;
	sub.s32 	%r220, %r219, %r28;
	mul.wide.s32 	%rd73, %r220, 4;
	add.s64 	%rd74, %rd1, %rd73;
	ld.local.u32 	%r747, [%rd74];
	ld.local.u32 	%r748, [%rd74+-4];
	and.b32  	%r34, %r26, 31;
	setp.eq.s32 	%p20, %r34, 0;
	@%p20 bra 	$L__BB0_19;

	mov.u32 	%r221, 32;
	sub.s32 	%r222, %r221, %r34;
	shr.u32 	%r223, %r748, %r222;
	shl.b32 	%r224, %r747, %r34;
	add.s32 	%r747, %r223, %r224;
	mul.wide.s32 	%rd75, %r31, 4;
	add.s64 	%rd76, %rd1, %rd75;
	ld.local.u32 	%r225, [%rd76];
	shr.u32 	%r226, %r225, %r222;
	shl.b32 	%r227, %r748, %r34;
	add.s32 	%r748, %r226, %r227;

$L__BB0_19:
	and.b32  	%r228, %r25, -2147483648;
	shr.u32 	%r229, %r748, 30;
	shl.b32 	%r230, %r747, 2;
	or.b32  	%r231, %r229, %r230;
	shr.u32 	%r232, %r231, 31;
	shr.u32 	%r233, %r747, 30;
	add.s32 	%r234, %r232, %r233;
	neg.s32 	%r235, %r234;
	setp.eq.s32 	%p21, %r228, 0;
	selp.b32 	%r749, %r234, %r235, %p21;
	setp.ne.s32 	%p22, %r232, 0;
	xor.b32  	%r236, %r228, -2147483648;
	selp.b32 	%r237, %r236, %r228, %p22;
	selp.b32 	%r238, -1, 0, %p22;
	xor.b32  	%r239, %r231, %r238;
	shl.b32 	%r240, %r748, 2;
	xor.b32  	%r241, %r240, %r238;
	cvt.u64.u32 	%rd77, %r239;
	cvt.u64.u32 	%rd78, %r241;
	bfi.b64 	%rd79, %rd77, %rd78, 32, 32;
	cvt.rn.f64.s64 	%fd3, %rd79;
	mul.f64 	%fd4, %fd3, 0d3BF921FB54442D19;
	cvt.rn.f32.f64 	%f399, %fd4;
	setp.eq.s32 	%p23, %r237, 0;
	neg.f32 	%f400, %f399;
	selp.f32 	%f1354, %f399, %f400, %p23;

$L__BB0_21:
	mul.f32 	%f30, %f13, %f1353;
	and.b32  	%r41, %r749, 1;
	setp.eq.s32 	%p24, %r41, 0;
	selp.f32 	%f31, %f1354, 0f3F800000, %p24;
	mul.rn.f32 	%f32, %f1354, %f1354;
	mov.f32 	%f1355, 0fB94D4153;
	@%p24 bra 	$L__BB0_23;

	mov.f32 	%f403, 0fBAB607ED;
	mov.f32 	%f404, 0f37CBAC00;
	fma.rn.f32 	%f1355, %f404, %f32, %f403;

$L__BB0_23:
	selp.f32 	%f405, 0f3C0885E4, 0f3D2AAABB, %p24;
	fma.rn.f32 	%f406, %f1355, %f32, %f405;
	selp.f32 	%f407, 0fBE2AAAA8, 0fBEFFFFFF, %p24;
	fma.rn.f32 	%f408, %f406, %f32, %f407;
	mov.f32 	%f409, 0f00000000;
	fma.rn.f32 	%f410, %f32, %f31, %f409;
	fma.rn.f32 	%f1356, %f408, %f410, %f31;
	and.b32  	%r243, %r749, 2;
	setp.eq.s32 	%p26, %r243, 0;
	@%p26 bra 	$L__BB0_25;

	mov.f32 	%f412, 0fBF800000;
	fma.rn.f32 	%f1356, %f1356, %f412, %f409;

$L__BB0_25:
	mul.f32 	%f413, %f30, %f30;
	mov.f32 	%f414, 0f3F800000;
	sub.f32 	%f415, %f414, %f413;
	mul.f32 	%f416, %f13, %f1356;
	mul.f32 	%f417, %f416, %f416;
	sub.f32 	%f418, %f415, %f417;
	max.f32 	%f420, %f409, %f418;
	sqrt.rn.f32 	%f421, %f420;
	mul.f32 	%f422, %f10, %f416;
	mul.f32 	%f423, %f11, %f416;
	mul.f32 	%f424, %f12, %f416;
	mul.f32 	%f425, %f8, %f11;
	mul.f32 	%f426, %f9, %f12;
	sub.f32 	%f427, %f425, %f426;
	fma.rn.f32 	%f428, %f427, %f30, %f422;
	mul.f32 	%f429, %f7, %f12;
	mul.f32 	%f430, %f8, %f10;
	sub.f32 	%f431, %f429, %f430;
	fma.rn.f32 	%f432, %f431, %f30, %f423;
	mul.f32 	%f433, %f9, %f10;
	mul.f32 	%f434, %f7, %f11;
	sub.f32 	%f435, %f433, %f434;
	fma.rn.f32 	%f436, %f435, %f30, %f424;
	fma.rn.f32 	%f1357, %f7, %f421, %f428;
	fma.rn.f32 	%f1358, %f9, %f421, %f432;
	fma.rn.f32 	%f1359, %f8, %f421, %f436;

$L__BB0_27:
	ld.const.u64 	%rd80, [params+176];
	cvta.to.global.u64 	%rd81, %rd80;
	ld.const.u32 	%r244, [params+168];
	mad.lo.s32 	%r245, %r244, %r156, %r155;
	mul.wide.u32 	%rd82, %r245, 12;
	add.s64 	%rd15, %rd81, %rd82;
	ld.global.f32 	%f53, [%rd15+4];
	ld.global.f32 	%f54, [%rd15];
	add.f32 	%f495, %f54, %f53;
	ld.global.f32 	%f55, [%rd15+8];
	add.f32 	%f496, %f495, %f55;
	setp.eq.f32 	%p27, %f496, 0f00000000;
	mov.f32 	%f1363, 0f00000000;
	setp.ne.s32 	%p28, %r5, 0;
	mov.f32 	%f1366, 0fBF800000;
	and.pred  	%p29, %p28, %p27;
	mov.f32 	%f1364, %f1363;
	mov.f32 	%f1365, %f1363;
	mov.f32 	%f1367, %f1363;
	mov.f32 	%f1368, %f1363;
	mov.f32 	%f1369, %f1363;
	@%p29 bra 	$L__BB0_29;

	ld.const.u64 	%rd83, [params+64];
	mov.f32 	%f504, 0f6C4ECB8F;
	mov.f32 	%f505, 0f00000000;
	mov.u32 	%r279, 1;
	mov.u32 	%r282, 2;
	mov.u32 	%r284, 7;
	mov.u32 	%r288, 2139095039;
	mov.u32 	%r291, 1065353216;
	mov.u32 	%r316, 0;
	// begin inline asm
	call(%r246,%r247,%r248,%r249,%r250,%r251,%r252,%r253,%r254,%r255,%r256,%r257,%r258,%r259,%r260,%r261,%r262,%r263,%r264,%r265,%r266,%r267,%r268,%r269,%r270,%r271,%r272,%r273,%r274,%r275,%r276,%r277),_optix_trace_typed_32,(%r316,%rd83,%f1360,%f1361,%f1362,%f1357,%f1358,%f1359,%f505,%f504,%f505,%r279,%r316,%r316,%r282,%r316,%r284,%r316,%r316,%r316,%r288,%r291,%r291,%r291,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316,%r316);
	// end inline asm
	mov.b32 	%f1363, %r246;
	mov.b32 	%f1364, %r247;
	mov.b32 	%f1365, %r248;
	mov.b32 	%f1366, %r249;
	mov.b32 	%f1367, %r250;
	mov.b32 	%f1368, %r251;
	mov.b32 	%f1369, %r252;

$L__BB0_29:
	setp.ltu.f32 	%p30, %f1366, 0f00000000;
	@%p30 bra 	$L__BB0_125;
	bra.uni 	$L__BB0_30;

$L__BB0_125:
	selp.u16 	%rs16, 1, 0, %p5;
	mov.f32 	%f1423, 0f00000000;
	mov.f32 	%f1424, %f1423;
	mov.f32 	%f1425, %f1423;
	mov.f32 	%f1426, %f1423;
	mov.f32 	%f1427, %f1423;
	mov.f32 	%f1428, %f1423;
	mov.f32 	%f1429, %f1423;
	mov.f32 	%f1430, %f1423;
	mov.f32 	%f1431, %f1423;
	bra.uni 	$L__BB0_126;

$L__BB0_30:
	fma.rn.f32 	%f506, %f1357, %f1366, %f1360;
	fma.rn.f32 	%f507, %f1358, %f1366, %f1361;
	fma.rn.f32 	%f508, %f1359, %f1366, %f1362;
	mul.f32 	%f509, %f506, 0f3456BF95;
	mul.f32 	%f510, %f507, 0f3456BF95;
	mul.f32 	%f511, %f508, 0f3456BF95;
	abs.f32 	%f512, %f509;
	abs.f32 	%f513, %f510;
	abs.f32 	%f514, %f511;
	max.f32 	%f515, %f512, %f513;
	max.f32 	%f516, %f515, %f514;
	mov.f32 	%f517, 0f38D1B717;
	max.f32 	%f518, %f516, %f517;
	fma.rn.f32 	%f70, %f1363, %f518, %f506;
	fma.rn.f32 	%f71, %f1364, %f518, %f507;
	fma.rn.f32 	%f72, %f1365, %f518, %f508;
	ld.const.u64 	%rd84, [params+144];
	cvta.to.global.u64 	%rd85, %rd84;
	ld.const.u32 	%r317, [params+136];
	mad.lo.s32 	%r318, %r317, %r156, %r155;
	mul.wide.u32 	%rd86, %r318, 12;
	add.s64 	%rd87, %rd85, %rd86;
	st.global.f32 	[%rd87], %f70;
	st.global.f32 	[%rd87+4], %f71;
	st.global.f32 	[%rd87+8], %f72;
	ld.const.u64 	%rd88, [params+160];
	cvta.to.global.u64 	%rd89, %rd88;
	ld.const.u32 	%r319, [params+152];
	mad.lo.s32 	%r320, %r319, %r156, %r155;
	mul.wide.u32 	%rd90, %r320, 12;
	add.s64 	%rd91, %rd89, %rd90;
	st.global.f32 	[%rd91], %f1363;
	st.global.f32 	[%rd91+4], %f1364;
	st.global.f32 	[%rd91+8], %f1365;
	neg.f32 	%f519, %f1367;
	setp.lt.f32 	%p31, %f1367, 0f00000000;
	selp.f32 	%f520, %f519, %f1367, %p31;
	ld.const.f32 	%f521, [params+372];
	selp.f32 	%f522, %f521, 0f3F800000, %p31;
	cvt.rmi.f32.f32 	%f523, %f520;
	sub.f32 	%f524, %f520, %f523;
	cvt.rmi.f32.f32 	%f525, %f1368;
	sub.f32 	%f526, %f1368, %f525;
	cvt.rmi.f32.f32 	%f527, %f1369;
	sub.f32 	%f528, %f1369, %f527;
	mul.f32 	%f1426, %f522, %f524;
	mul.f32 	%f1427, %f522, %f526;
	mul.f32 	%f1428, %f522, %f528;
	mul.f32 	%f1423, %f523, 0f3B808081;
	mul.f32 	%f1424, %f525, 0f3B808081;
	mul.f32 	%f1425, %f527, 0f3B808081;
	setp.lt.s32 	%p32, %r5, 1;
	@%p32 bra 	$L__BB0_32;

	mul.f32 	%f1426, %f54, %f1426;
	mul.f32 	%f1427, %f53, %f1427;
	mul.f32 	%f1428, %f55, %f1428;
	mul.f32 	%f1423, %f54, %f1423;
	mul.f32 	%f1424, %f53, %f1424;
	mul.f32 	%f1425, %f55, %f1425;

$L__BB0_32:
	ld.const.u32 	%r42, [params+200];
	setp.eq.s32 	%p33, %r42, 0;
	mov.f32 	%f1431, 0f00000000;
	mov.f32 	%f1430, %f1431;
	mov.f32 	%f1429, %f1431;
	@%p33 bra 	$L__BB0_96;

	cvt.rn.f32.u32 	%f91, %r42;
	mul.f32 	%f532, %f3, %f91;
	cvt.rzi.u32.f32 	%r321, %f532;
	add.s32 	%r322, %r42, -1;
	min.u32 	%r323, %r321, %r322;
	ld.const.u64 	%rd92, [params+208];
	cvta.to.global.u64 	%rd93, %rd92;
	mul.wide.u32 	%rd94, %r323, 64;
	add.s64 	%rd16, %rd93, %rd94;
	ld.global.v4.f32 	{%f533, %f534, %f535, %f536}, [%rd16];
	ld.global.v4.f32 	{%f537, %f538, %f539, %f540}, [%rd16+16];
	ld.global.u64 	%rd17, [%rd16+48];
	setp.lt.f32 	%p34, %f533, 0f3F800000;
	@%p34 bra 	$L__BB0_65;
	bra.uni 	$L__BB0_34;

$L__BB0_65:
	fma.rn.f32 	%f648, %f534, 0f40000000, 0fBF800000;
	fma.rn.f32 	%f649, %f535, 0f40000000, 0fBF800000;
	abs.f32 	%f650, %f648;
	mov.f32 	%f1391, 0f3F800000;
	sub.f32 	%f651, %f1391, %f650;
	abs.f32 	%f652, %f649;
	sub.f32 	%f653, %f651, %f652;
	neg.f32 	%f654, %f653;
	cvt.sat.f32.f32 	%f655, %f654;
	setp.ge.f32 	%p61, %f648, 0f00000000;
	neg.f32 	%f656, %f655;
	selp.f32 	%f657, %f656, %f655, %p61;
	add.f32 	%f658, %f648, %f657;
	setp.ge.f32 	%p62, %f649, 0f00000000;
	selp.f32 	%f659, %f656, %f655, %p62;
	add.f32 	%f660, %f649, %f659;
	mul.f32 	%f661, %f660, %f660;
	fma.rn.f32 	%f662, %f658, %f658, %f661;
	fma.rn.f32 	%f663, %f653, %f653, %f662;
	sqrt.rn.f32 	%f664, %f663;
	rcp.rn.f32 	%f665, %f664;
	mul.f32 	%f154, %f658, %f665;
	mul.f32 	%f155, %f660, %f665;
	mul.f32 	%f156, %f653, %f665;
	neg.f32 	%f157, %f155;
	neg.f32 	%f158, %f156;
	mul.f32 	%f666, %f1363, %f154;
	mul.f32 	%f667, %f1364, %f157;
	sub.f32 	%f668, %f667, %f666;
	mul.f32 	%f669, %f1365, %f156;
	sub.f32 	%f159, %f668, %f669;
	setp.leu.f32 	%p63, %f159, 0f00000000;
	setp.eq.s64 	%p64, %rd17, 0;
	or.pred  	%p65, %p64, %p63;
	mov.f32 	%f1392, %f1391;
	mov.f32 	%f1393, %f1391;
	mov.f32 	%f1394, %f159;
	@%p65 bra 	$L__BB0_67;

	ld.global.v4.f32 	{%f670, %f671, %f672, %f673}, [%rd16+32];
	abs.f32 	%f674, %f154;
	abs.f32 	%f675, %f156;
	setp.gt.f32 	%p66, %f674, %f675;
	selp.f32 	%f676, %f157, 0f00000000, %p66;
	selp.f32 	%f677, %f154, %f158, %p66;
	selp.f32 	%f678, 0f00000000, %f155, %p66;
	mul.f32 	%f679, %f677, %f677;
	fma.rn.f32 	%f680, %f676, %f676, %f679;
	fma.rn.f32 	%f681, %f678, %f678, %f680;
	sqrt.rn.f32 	%f682, %f681;
	rcp.rn.f32 	%f683, %f682;
	mul.f32 	%f684, %f676, %f683;
	mul.f32 	%f685, %f677, %f683;
	mul.f32 	%f686, %f678, %f683;
	mul.f32 	%f687, %f156, %f685;
	mul.f32 	%f688, %f155, %f686;
	sub.f32 	%f689, %f687, %f688;
	mul.f32 	%f690, %f154, %f686;
	mul.f32 	%f691, %f156, %f684;
	sub.f32 	%f692, %f690, %f691;
	mul.f32 	%f693, %f155, %f684;
	mul.f32 	%f694, %f154, %f685;
	sub.f32 	%f695, %f693, %f694;
	mul.f32 	%f696, %f71, %f692;
	fma.rn.f32 	%f697, %f70, %f689, %f696;
	fma.rn.f32 	%f698, %f72, %f695, %f697;
	fma.rn.f32 	%f701, %f670, %f698, %f672;
	mul.f32 	%f702, %f71, %f685;
	fma.rn.f32 	%f703, %f70, %f684, %f702;
	fma.rn.f32 	%f704, %f72, %f686, %f703;
	fma.rn.f32 	%f707, %f671, %f704, %f673;
	tex.2d.v4.f32.f32 	{%f1391, %f1392, %f1393, %f708}, [%rd17, {%f701, %f707}];
	max.f32 	%f709, %f1391, %f1392;
	max.f32 	%f710, %f709, %f1393;
	mul.f32 	%f1394, %f159, %f710;

$L__BB0_67:
	setp.le.f32 	%p67, %f1394, 0f00000000;
	mov.f32 	%f1402, 0f00000000;
	mov.f32 	%f1403, %f1402;
	mov.f32 	%f1404, %f1402;
	@%p67 bra 	$L__BB0_95;

	abs.f32 	%f715, %f154;
	abs.f32 	%f716, %f156;
	setp.gt.f32 	%p68, %f715, %f716;
	selp.f32 	%f717, %f157, 0f00000000, %p68;
	selp.f32 	%f718, %f154, %f158, %p68;
	selp.f32 	%f719, 0f00000000, %f155, %p68;
	mul.f32 	%f720, %f718, %f718;
	fma.rn.f32 	%f721, %f717, %f717, %f720;
	fma.rn.f32 	%f722, %f719, %f719, %f721;
	sqrt.rn.f32 	%f723, %f722;
	rcp.rn.f32 	%f724, %f723;
	mov.f32 	%f1401, 0f3F800000;
	mul.f32 	%f168, %f717, %f724;
	mul.f32 	%f169, %f718, %f724;
	mul.f32 	%f170, %f719, %f724;
	setp.ltu.f32 	%p69, %f537, 0f00000000;
	@%p69 bra 	$L__BB0_94;

	sqrt.rn.f32 	%f171, %f1;
	mul.f32 	%f172, %f2, 0f40C90FDB;
	mul.f32 	%f725, %f172, 0f3F22F983;
	cvt.rni.s32.f32 	%r765, %f725;
	cvt.rn.f32.s32 	%f726, %r765;
	mov.f32 	%f727, 0fBFC90FDA;
	fma.rn.f32 	%f728, %f726, %f727, %f172;
	mov.f32 	%f729, 0fB3A22168;
	fma.rn.f32 	%f730, %f726, %f729, %f728;
	mov.f32 	%f731, 0fA7C234C5;
	fma.rn.f32 	%f1398, %f726, %f731, %f730;
	abs.f32 	%f174, %f172;
	setp.ltu.f32 	%p70, %f174, 0f47CE4780;
	mov.u32 	%r761, %r765;
	mov.f32 	%f1395, %f1398;
	@%p70 bra 	$L__BB0_77;

	setp.eq.f32 	%p71, %f174, 0f7F800000;
	@%p71 bra 	$L__BB0_76;
	bra.uni 	$L__BB0_71;

$L__BB0_76:
	mov.f32 	%f734, 0f00000000;
	mul.rn.f32 	%f1395, %f172, %f734;
	mov.u32 	%r761, 0;
	bra.uni 	$L__BB0_77;

$L__BB0_34:
	abs.f32 	%f541, %f1363;
	abs.f32 	%f542, %f1365;
	setp.gt.f32 	%p35, %f541, %f542;
	neg.f32 	%f543, %f1364;
	selp.f32 	%f544, %f543, 0f00000000, %p35;
	neg.f32 	%f545, %f1365;
	selp.f32 	%f546, %f1363, %f545, %p35;
	selp.f32 	%f547, 0f00000000, %f1364, %p35;
	mul.f32 	%f548, %f546, %f546;
	fma.rn.f32 	%f549, %f544, %f544, %f548;
	fma.rn.f32 	%f550, %f547, %f547, %f549;
	sqrt.rn.f32 	%f551, %f550;
	rcp.rn.f32 	%f552, %f551;
	mul.f32 	%f102, %f544, %f552;
	mul.f32 	%f103, %f546, %f552;
	mul.f32 	%f104, %f547, %f552;
	sqrt.rn.f32 	%f105, %f1;
	mul.f32 	%f106, %f2, 0f40C90FDB;
	mul.f32 	%f553, %f106, 0f3F22F983;
	cvt.rni.s32.f32 	%r757, %f553;
	cvt.rn.f32.s32 	%f554, %r757;
	mov.f32 	%f555, 0fBFC90FDA;
	fma.rn.f32 	%f556, %f554, %f555, %f106;
	mov.f32 	%f557, 0fB3A22168;
	fma.rn.f32 	%f558, %f554, %f557, %f556;
	mov.f32 	%f559, 0fA7C234C5;
	fma.rn.f32 	%f1379, %f554, %f559, %f558;
	abs.f32 	%f108, %f106;
	setp.ltu.f32 	%p36, %f108, 0f47CE4780;
	mov.u32 	%r753, %r757;
	mov.f32 	%f1376, %f1379;
	@%p36 bra 	$L__BB0_42;

	setp.eq.f32 	%p37, %f108, 0f7F800000;
	@%p37 bra 	$L__BB0_41;
	bra.uni 	$L__BB0_36;

$L__BB0_41:
	mov.f32 	%f562, 0f00000000;
	mul.rn.f32 	%f1376, %f106, %f562;
	mov.u32 	%r753, 0;
	bra.uni 	$L__BB0_42;

$L__BB0_36:
	mov.b32 	%r44, %f106;
	bfe.u32 	%r325, %r44, 23, 8;
	add.s32 	%r45, %r325, -128;
	shl.b32 	%r326, %r44, 8;
	or.b32  	%r46, %r326, -2147483648;
	shr.u32 	%r47, %r45, 5;
	mov.u64 	%rd169, 0;
	mov.u32 	%r750, 0;
	mov.u64 	%rd168, __cudart_i2opi_f;
	mov.u64 	%rd167, %rd1;

$L__BB0_37:
	.pragma "nounroll";
	ld.global.nc.u32 	%r327, [%rd168];
	mad.wide.u32 	%rd97, %r327, %r46, %rd169;
	shr.u64 	%rd169, %rd97, 32;
	st.local.u32 	[%rd167], %rd97;
	add.s64 	%rd168, %rd168, 4;
	add.s64 	%rd167, %rd167, 4;
	add.s32 	%r750, %r750, 1;
	setp.ne.s32 	%p38, %r750, 6;
	@%p38 bra 	$L__BB0_37;

	st.local.u32 	[%rd1+24], %rd169;
	mov.u32 	%r328, 4;
	sub.s32 	%r50, %r328, %r47;
	mov.u32 	%r329, 6;
	sub.s32 	%r330, %r329, %r47;
	mul.wide.s32 	%rd98, %r330, 4;
	add.s64 	%rd99, %rd1, %rd98;
	ld.local.u32 	%r751, [%rd99];
	ld.local.u32 	%r752, [%rd99+-4];
	and.b32  	%r53, %r45, 31;
	setp.eq.s32 	%p39, %r53, 0;
	@%p39 bra 	$L__BB0_40;

	mov.u32 	%r331, 32;
	sub.s32 	%r332, %r331, %r53;
	shr.u32 	%r333, %r752, %r332;
	shl.b32 	%r334, %r751, %r53;
	add.s32 	%r751, %r333, %r334;
	mul.wide.s32 	%rd100, %r50, 4;
	add.s64 	%rd101, %rd1, %rd100;
	ld.local.u32 	%r335, [%rd101];
	shr.u32 	%r336, %r335, %r332;
	shl.b32 	%r337, %r752, %r53;
	add.s32 	%r752, %r336, %r337;

$L__BB0_40:
	and.b32  	%r338, %r44, -2147483648;
	shr.u32 	%r339, %r752, 30;
	shl.b32 	%r340, %r751, 2;
	or.b32  	%r341, %r339, %r340;
	shr.u32 	%r342, %r341, 31;
	shr.u32 	%r343, %r751, 30;
	add.s32 	%r344, %r342, %r343;
	neg.s32 	%r345, %r344;
	setp.eq.s32 	%p40, %r338, 0;
	selp.b32 	%r753, %r344, %r345, %p40;
	setp.ne.s32 	%p41, %r342, 0;
	xor.b32  	%r346, %r338, -2147483648;
	selp.b32 	%r347, %r346, %r338, %p41;
	selp.b32 	%r348, -1, 0, %p41;
	xor.b32  	%r349, %r341, %r348;
	shl.b32 	%r350, %r752, 2;
	xor.b32  	%r351, %r350, %r348;
	cvt.u64.u32 	%rd102, %r349;
	cvt.u64.u32 	%rd103, %r351;
	bfi.b64 	%rd104, %rd102, %rd103, 32, 32;
	cvt.rn.f64.s64 	%fd5, %rd104;
	mul.f64 	%fd6, %fd5, 0d3BF921FB54442D19;
	cvt.rn.f32.f64 	%f560, %fd6;
	setp.eq.s32 	%p42, %r347, 0;
	neg.f32 	%f561, %f560;
	selp.f32 	%f1376, %f560, %f561, %p42;

$L__BB0_42:
	add.s32 	%r60, %r753, 1;
	and.b32  	%r61, %r60, 1;
	setp.eq.s32 	%p43, %r61, 0;
	selp.f32 	%f112, %f1376, 0f3F800000, %p43;
	mul.rn.f32 	%f113, %f1376, %f1376;
	mov.f32 	%f1377, 0fB94D4153;
	@%p43 bra 	$L__BB0_44;

	mov.f32 	%f564, 0fBAB607ED;
	mov.f32 	%f565, 0f37CBAC00;
	fma.rn.f32 	%f1377, %f565, %f113, %f564;

$L__BB0_44:
	selp.f32 	%f566, 0f3C0885E4, 0f3D2AAABB, %p43;
	fma.rn.f32 	%f567, %f1377, %f113, %f566;
	selp.f32 	%f568, 0fBE2AAAA8, 0fBEFFFFFF, %p43;
	fma.rn.f32 	%f569, %f567, %f113, %f568;
	mov.f32 	%f570, 0f00000000;
	fma.rn.f32 	%f571, %f113, %f112, %f570;
	fma.rn.f32 	%f1378, %f569, %f571, %f112;
	and.b32  	%r353, %r60, 2;
	setp.eq.s32 	%p45, %r353, 0;
	@%p45 bra 	$L__BB0_46;

	mov.f32 	%f573, 0fBF800000;
	fma.rn.f32 	%f1378, %f1378, %f573, %f570;

$L__BB0_46:
	@%p36 bra 	$L__BB0_54;

	setp.eq.f32 	%p47, %f108, 0f7F800000;
	@%p47 bra 	$L__BB0_53;
	bra.uni 	$L__BB0_48;

$L__BB0_53:
	mov.f32 	%f576, 0f00000000;
	mul.rn.f32 	%f1379, %f106, %f576;
	mov.u32 	%r757, 0;
	bra.uni 	$L__BB0_54;

$L__BB0_48:
	mov.b32 	%r62, %f106;
	bfe.u32 	%r355, %r62, 23, 8;
	add.s32 	%r63, %r355, -128;
	shl.b32 	%r356, %r62, 8;
	or.b32  	%r64, %r356, -2147483648;
	shr.u32 	%r65, %r63, 5;
	mov.u64 	%rd172, 0;
	mov.u32 	%r754, 0;
	mov.u64 	%rd171, __cudart_i2opi_f;
	mov.u64 	%rd170, %rd1;

$L__BB0_49:
	.pragma "nounroll";
	ld.global.nc.u32 	%r357, [%rd171];
	mad.wide.u32 	%rd107, %r357, %r64, %rd172;
	shr.u64 	%rd172, %rd107, 32;
	st.local.u32 	[%rd170], %rd107;
	add.s64 	%rd171, %rd171, 4;
	add.s64 	%rd170, %rd170, 4;
	add.s32 	%r754, %r754, 1;
	setp.ne.s32 	%p48, %r754, 6;
	@%p48 bra 	$L__BB0_49;

	st.local.u32 	[%rd1+24], %rd172;
	mov.u32 	%r358, 4;
	sub.s32 	%r68, %r358, %r65;
	mov.u32 	%r359, 6;
	sub.s32 	%r360, %r359, %r65;
	mul.wide.s32 	%rd108, %r360, 4;
	add.s64 	%rd109, %rd1, %rd108;
	ld.local.u32 	%r755, [%rd109];
	ld.local.u32 	%r756, [%rd109+-4];
	and.b32  	%r71, %r63, 31;
	setp.eq.s32 	%p49, %r71, 0;
	@%p49 bra 	$L__BB0_52;

	mov.u32 	%r361, 32;
	sub.s32 	%r362, %r361, %r71;
	shr.u32 	%r363, %r756, %r362;
	shl.b32 	%r364, %r755, %r71;
	add.s32 	%r755, %r363, %r364;
	mul.wide.s32 	%rd110, %r68, 4;
	add.s64 	%rd111, %rd1, %rd110;
	ld.local.u32 	%r365, [%rd111];
	shr.u32 	%r366, %r365, %r362;
	shl.b32 	%r367, %r756, %r71;
	add.s32 	%r756, %r366, %r367;

$L__BB0_52:
	and.b32  	%r368, %r62, -2147483648;
	shr.u32 	%r369, %r756, 30;
	shl.b32 	%r370, %r755, 2;
	or.b32  	%r371, %r369, %r370;
	shr.u32 	%r372, %r371, 31;
	shr.u32 	%r373, %r755, 30;
	add.s32 	%r374, %r372, %r373;
	neg.s32 	%r375, %r374;
	setp.eq.s32 	%p50, %r368, 0;
	selp.b32 	%r757, %r374, %r375, %p50;
	setp.ne.s32 	%p51, %r372, 0;
	xor.b32  	%r376, %r368, -2147483648;
	selp.b32 	%r377, %r376, %r368, %p51;
	selp.b32 	%r378, -1, 0, %p51;
	xor.b32  	%r379, %r371, %r378;
	shl.b32 	%r380, %r756, 2;
	xor.b32  	%r381, %r380, %r378;
	cvt.u64.u32 	%rd112, %r379;
	cvt.u64.u32 	%rd113, %r381;
	bfi.b64 	%rd114, %rd112, %rd113, 32, 32;
	cvt.rn.f64.s64 	%fd7, %rd114;
	mul.f64 	%fd8, %fd7, 0d3BF921FB54442D19;
	cvt.rn.f32.f64 	%f574, %fd8;
	setp.eq.s32 	%p52, %r377, 0;
	neg.f32 	%f575, %f574;
	selp.f32 	%f1379, %f574, %f575, %p52;

$L__BB0_54:
	mul.f32 	%f122, %f105, %f1378;
	and.b32  	%r78, %r757, 1;
	setp.eq.s32 	%p53, %r78, 0;
	selp.f32 	%f123, %f1379, 0f3F800000, %p53;
	mul.rn.f32 	%f124, %f1379, %f1379;
	mov.f32 	%f1380, 0fB94D4153;
	@%p53 bra 	$L__BB0_56;

	mov.f32 	%f578, 0fBAB607ED;
	mov.f32 	%f579, 0f37CBAC00;
	fma.rn.f32 	%f1380, %f579, %f124, %f578;

$L__BB0_56:
	selp.f32 	%f580, 0f3C0885E4, 0f3D2AAABB, %p53;
	fma.rn.f32 	%f581, %f1380, %f124, %f580;
	selp.f32 	%f582, 0fBE2AAAA8, 0fBEFFFFFF, %p53;
	fma.rn.f32 	%f583, %f581, %f124, %f582;
	mov.f32 	%f1388, 0f00000000;
	fma.rn.f32 	%f585, %f124, %f123, %f1388;
	fma.rn.f32 	%f1381, %f583, %f585, %f123;
	and.b32  	%r383, %r757, 2;
	setp.eq.s32 	%p55, %r383, 0;
	@%p55 bra 	$L__BB0_58;

	mov.f32 	%f586, 0f00000000;
	mov.f32 	%f587, 0fBF800000;
	fma.rn.f32 	%f1381, %f1381, %f587, %f586;

$L__BB0_58:
	mul.f32 	%f591, %f122, %f122;
	mov.f32 	%f1382, 0f3F800000;
	sub.f32 	%f593, %f1382, %f591;
	mul.f32 	%f594, %f105, %f1381;
	mul.f32 	%f595, %f594, %f594;
	sub.f32 	%f596, %f593, %f595;
	max.f32 	%f597, %f1388, %f596;
	sqrt.rn.f32 	%f598, %f597;
	mul.f32 	%f599, %f102, %f594;
	mul.f32 	%f600, %f103, %f594;
	mul.f32 	%f601, %f104, %f594;
	mul.f32 	%f602, %f1365, %f103;
	mul.f32 	%f603, %f1364, %f104;
	sub.f32 	%f604, %f602, %f603;
	fma.rn.f32 	%f605, %f604, %f122, %f599;
	mul.f32 	%f606, %f1363, %f104;
	mul.f32 	%f607, %f1365, %f102;
	sub.f32 	%f608, %f606, %f607;
	fma.rn.f32 	%f609, %f608, %f122, %f600;
	mul.f32 	%f610, %f1364, %f102;
	mul.f32 	%f611, %f1363, %f103;
	sub.f32 	%f612, %f610, %f611;
	fma.rn.f32 	%f613, %f612, %f122, %f601;
	fma.rn.f32 	%f130, %f1363, %f598, %f605;
	fma.rn.f32 	%f131, %f1364, %f598, %f609;
	fma.rn.f32 	%f132, %f1365, %f598, %f613;
	setp.leu.f32 	%p56, %f131, 0f00000000;
	setp.neu.f32 	%p57, %f537, 0f00000000;
	and.pred  	%p58, %p57, %p56;
	mov.f32 	%f1389, %f1388;
	mov.f32 	%f1390, %f1388;
	@%p58 bra 	$L__BB0_62;

	mul.f32 	%f626, %f70, 0f3456BF95;
	abs.f32 	%f627, %f626;
	mul.f32 	%f628, %f71, 0f3456BF95;
	abs.f32 	%f629, %f628;
	mul.f32 	%f630, %f72, 0f3456BF95;
	abs.f32 	%f631, %f630;
	max.f32 	%f632, %f627, %f629;
	max.f32 	%f633, %f632, %f631;
	mov.f32 	%f634, 0f38D1B717;
	max.f32 	%f620, %f633, %f634;
	ld.const.u64 	%rd115, [params+64];
	mov.f32 	%f621, 0f6C4ECB8F;
	mov.f32 	%f622, 0f00000000;
	mov.u32 	%r420, 2;
	mov.u32 	%r422, 1;
	mov.u32 	%r423, 1065353216;
	mov.u32 	%r454, 0;
	// begin inline asm
	call(%r384,%r385,%r386,%r387,%r388,%r389,%r390,%r391,%r392,%r393,%r394,%r395,%r396,%r397,%r398,%r399,%r400,%r401,%r402,%r403,%r404,%r405,%r406,%r407,%r408,%r409,%r410,%r411,%r412,%r413,%r414,%r415),_optix_trace_typed_32,(%r454,%rd115,%f70,%f71,%f72,%f130,%f131,%f132,%f620,%f621,%f622,%r422,%r454,%r422,%r420,%r422,%r422,%r423,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454,%r454);
	// end inline asm
	setp.leu.f32 	%p59, %f534, 0f00000000;
	mov.f32 	%f1383, %f1382;
	mov.f32 	%f1384, %f1382;
	@%p59 bra 	$L__BB0_61;

	neg.f32 	%f635, %f132;
	neg.f32 	%f636, %f130;
	neg.f32 	%f637, %f131;
	tex.cube.v4.f32.f32 	{%f1382, %f1383, %f1384, %f638}, [%rd17, {%f635, %f637, %f636, %f636}];

$L__BB0_61:
	mov.b32 	%f639, %r384;
	fma.rn.f32 	%f1388, %f1382, %f639, 0f00000000;
	fma.rn.f32 	%f1389, %f1383, %f639, 0f00000000;
	fma.rn.f32 	%f1390, %f1384, %f639, 0f00000000;

$L__BB0_62:
	@%p32 bra 	$L__BB0_64;

	add.f32 	%f640, %f533, 0fBF800000;
	mul.f32 	%f641, %f640, 0f42C80000;
	mul.f32 	%f1388, %f641, %f1388;
	mul.f32 	%f1389, %f641, %f1389;
	mul.f32 	%f1390, %f641, %f1390;

$L__BB0_64:
	mul.f32 	%f642, %f538, %f1388;
	mul.f32 	%f1429, %f642, %f91;
	mul.f32 	%f643, %f539, %f1389;
	mul.f32 	%f1430, %f643, %f91;
	mul.f32 	%f644, %f540, %f1390;
	mul.f32 	%f1431, %f644, %f91;
	bra.uni 	$L__BB0_96;

$L__BB0_71:
	// Wide argument reduction of %f172 against the 6-word table
	// __cudart_i2opi_f (presumably the bits of 2/pi, judging by the
	// name -- NOTE(review): confirm). Outputs: %r761 = signed quadrant
	// count, %f1395 = reduced argument; both are read at $L__BB0_77.
	mov.b32 	%r112, %f172;
	// %r456 = biased exponent field (bits 23..30); %r113 = exponent - 128.
	bfe.u32 	%r456, %r112, 23, 8;
	add.s32 	%r113, %r456, -128;
	// %r114 = mantissa shifted to the top of the word with the implicit
	// leading 1 made explicit (bit 31 forced on).
	shl.b32 	%r457, %r112, 8;
	or.b32  	%r114, %r457, -2147483648;
	// %r115 = whole 32-bit words of shift implied by the exponent.
	shr.u32 	%r115, %r113, 5;
	// %rd175 = running carry, %r758 = loop counter, %rd174 = table
	// cursor, %rd173 = cursor into the local scratch at %rd1.
	mov.u64 	%rd175, 0;
	mov.u32 	%r758, 0;
	mov.u64 	%rd174, __cudart_i2opi_f;
	mov.u64 	%rd173, %rd1;

$L__BB0_72:
	.pragma "nounroll";
	// Multi-word multiply: table[i] * mantissa + carry. The low 32 bits
	// go to scratch[i]; the high 32 bits become the next carry.
	ld.global.nc.u32 	%r458, [%rd174];
	mad.wide.u32 	%rd118, %r458, %r114, %rd175;
	shr.u64 	%rd175, %rd118, 32;
	st.local.u32 	[%rd173], %rd118;
	add.s64 	%rd174, %rd174, 4;
	add.s64 	%rd173, %rd173, 4;
	add.s32 	%r758, %r758, 1;
	// Exactly six iterations, one per table word.
	setp.ne.s32 	%p72, %r758, 6;
	@%p72 bra 	$L__BB0_72;

	// The final carry is the seventh product word (scratch[6]).
	st.local.u32 	[%rd1+24], %rd175;
	// Pick the product words addressed by the word shift:
	// %r759 = scratch[6 - %r115], %r760 = scratch[5 - %r115];
	// %r118 = 4 - %r115 indexes the next lower word, used only when a
	// sub-word bit shift is needed.
	mov.u32 	%r459, 4;
	sub.s32 	%r118, %r459, %r115;
	mov.u32 	%r460, 6;
	sub.s32 	%r461, %r460, %r115;
	mul.wide.s32 	%rd119, %r461, 4;
	add.s64 	%rd120, %rd1, %rd119;
	ld.local.u32 	%r759, [%rd120];
	ld.local.u32 	%r760, [%rd120+-4];
	// %r121 = remaining bit shift (0..31); skip the funnel shift if zero.
	and.b32  	%r121, %r113, 31;
	setp.eq.s32 	%p73, %r121, 0;
	@%p73 bra 	$L__BB0_75;

	// Funnel-shift the two selected words left by %r121 bits, pulling
	// the vacated low bits from the next lower product word.
	mov.u32 	%r462, 32;
	sub.s32 	%r463, %r462, %r121;
	shr.u32 	%r464, %r760, %r463;
	shl.b32 	%r465, %r759, %r121;
	add.s32 	%r759, %r464, %r465;
	mul.wide.s32 	%rd121, %r118, 4;
	add.s64 	%rd122, %rd1, %rd121;
	ld.local.u32 	%r466, [%rd122];
	shr.u32 	%r467, %r466, %r463;
	shl.b32 	%r468, %r760, %r121;
	add.s32 	%r760, %r467, %r468;

$L__BB0_75:
	// %r469 = sign bit of the original input.
	and.b32  	%r469, %r112, -2147483648;
	// %r472 = fraction word: %r759 with its top two bits shifted out,
	// refilled from the top two bits of %r760.
	shr.u32 	%r470, %r760, 30;
	shl.b32 	%r471, %r759, 2;
	or.b32  	%r472, %r470, %r471;
	// %r473 = top fraction bit (fraction >= 1/2): rounds the quadrant up.
	shr.u32 	%r473, %r472, 31;
	// %r474 = top two bits of %r759 = integer quadrant bits.
	shr.u32 	%r474, %r759, 30;
	add.s32 	%r475, %r473, %r474;
	neg.s32 	%r476, %r475;
	// The quadrant count takes the sign of the input.
	setp.eq.s32 	%p74, %r469, 0;
	selp.b32 	%r761, %r475, %r476, %p74;
	// When the quadrant was rounded up, the remainder is negative:
	// flip the result sign (%r478) and bit-complement the fraction.
	setp.ne.s32 	%p75, %r473, 0;
	xor.b32  	%r477, %r469, -2147483648;
	selp.b32 	%r478, %r477, %r469, %p75;
	selp.b32 	%r479, -1, 0, %p75;
	xor.b32  	%r480, %r472, %r479;
	shl.b32 	%r481, %r760, 2;
	xor.b32  	%r482, %r481, %r479;
	// Assemble the 64-bit fraction (%r480 high, %r482 low), convert it
	// to f64 and scale by 0d3BF921FB54442D19 (approximately
	// (pi/2) * 2^-64), then round to f32.
	cvt.u64.u32 	%rd123, %r480;
	cvt.u64.u32 	%rd124, %r482;
	bfi.b64 	%rd125, %rd123, %rd124, 32, 32;
	cvt.rn.f64.s64 	%fd9, %rd125;
	mul.f64 	%fd10, %fd9, 0d3BF921FB54442D19;
	cvt.rn.f32.f64 	%f732, %fd10;
	// Apply the sign selected above.
	setp.eq.s32 	%p76, %r478, 0;
	neg.f32 	%f733, %f732;
	selp.f32 	%f1395, %f732, %f733, %p76;

$L__BB0_77:
	// Evaluate a polynomial in the reduced argument %f1395, chosen by
	// the parity of (%r761 + 1); the result is left in %f1397.
	// NOTE(review): the two coefficient sets (about -1/6, 1/120 versus
	// about -1/2, 1/24) look like sine and cosine polynomials, and the
	// +1 quadrant offset would make this cos(%f172) -- confirm against
	// the CUDA source.
	add.s32 	%r128, %r761, 1;
	and.b32  	%r129, %r128, 1;
	// %p77 is true when (%r761 + 1) is even.
	setp.eq.s32 	%p77, %r129, 0;
	// Base term: the argument itself when %p77, otherwise 1.0.
	selp.f32 	%f178, %f1395, 0f3F800000, %p77;
	// %f179 = argument squared.
	mul.rn.f32 	%f179, %f1395, %f1395;
	// Leading coefficient for the %p77 case; the other case computes
	// its leading term with one extra fma below.
	mov.f32 	%f1396, 0fB94D4153;
	@%p77 bra 	$L__BB0_79;

	mov.f32 	%f736, 0fBAB607ED;
	mov.f32 	%f737, 0f37CBAC00;
	fma.rn.f32 	%f1396, %f737, %f179, %f736;

$L__BB0_79:
	// Horner steps in %f179 with per-case coefficients.
	selp.f32 	%f738, 0f3C0885E4, 0f3D2AAABB, %p77;
	fma.rn.f32 	%f739, %f1396, %f179, %f738;
	selp.f32 	%f740, 0fBE2AAAA8, 0fBEFFFFFF, %p77;
	fma.rn.f32 	%f741, %f739, %f179, %f740;
	mov.f32 	%f742, 0f00000000;
	// %f743 = x^2 * base; result = poly * (x^2 * base) + base.
	fma.rn.f32 	%f743, %f179, %f178, %f742;
	fma.rn.f32 	%f1397, %f741, %f743, %f178;
	// Bit 1 of (%r761 + 1) selects a sign flip of the result.
	and.b32  	%r484, %r128, 2;
	setp.eq.s32 	%p79, %r484, 0;
	@%p79 bra 	$L__BB0_81;

	// Negate: %f1397 = %f1397 * -1.0 + 0.0.
	mov.f32 	%f745, 0fBF800000;
	fma.rn.f32 	%f1397, %f1397, %f745, %f742;

$L__BB0_81:
	@%p70 bra 	$L__BB0_89;

	setp.eq.f32 	%p81, %f174, 0f7F800000;
	@%p81 bra 	$L__BB0_88;
	bra.uni 	$L__BB0_83;

$L__BB0_88:
	mov.f32 	%f748, 0f00000000;
	mul.rn.f32 	%f1398, %f172, %f748;
	mov.u32 	%r765, 0;
	bra.uni 	$L__BB0_89;

$L__BB0_83:
	mov.b32 	%r130, %f172;
	bfe.u32 	%r486, %r130, 23, 8;
	add.s32 	%r131, %r486, -128;
	shl.b32 	%r487, %r130, 8;
	or.b32  	%r132, %r487, -2147483648;
	shr.u32 	%r133, %r131, 5;
	mov.u64 	%rd178, 0;
	mov.u32 	%r762, 0;
	mov.u64 	%rd177, __cudart_i2opi_f;
	mov.u64 	%rd176, %rd1;

$L__BB0_84:
	.pragma "nounroll";
	ld.global.nc.u32 	%r488, [%rd177];
	mad.wide.u32 	%rd128, %r488, %r132, %rd178;
	shr.u64 	%rd178, %rd128, 32;
	st.local.u32 	[%rd176], %rd128;
	add.s64 	%rd177, %rd177, 4;
	add.s64 	%rd176, %rd176, 4;
	add.s32 	%r762, %r762, 1;
	setp.ne.s32 	%p82, %r762, 6;
	@%p82 bra 	$L__BB0_84;

	st.local.u32 	[%rd1+24], %rd178;
	mov.u32 	%r489, 4;
	sub.s32 	%r136, %r489, %r133;
	mov.u32 	%r490, 6;
	sub.s32 	%r491, %r490, %r133;
	mul.wide.s32 	%rd129, %r491, 4;
	add.s64 	%rd130, %rd1, %rd129;
	ld.local.u32 	%r763, [%rd130];
	ld.local.u32 	%r764, [%rd130+-4];
	and.b32  	%r139, %r131, 31;
	setp.eq.s32 	%p83, %r139, 0;
	@%p83 bra 	$L__BB0_87;

	mov.u32 	%r492, 32;
	sub.s32 	%r493, %r492, %r139;
	shr.u32 	%r494, %r764, %r493;
	shl.b32 	%r495, %r763, %r139;
	add.s32 	%r763, %r494, %r495;
	mul.wide.s32 	%rd131, %r136, 4;
	add.s64 	%rd132, %rd1, %rd131;
	ld.local.u32 	%r496, [%rd132];
	shr.u32 	%r497, %r496, %r493;
	shl.b32 	%r498, %r764, %r139;
	add.s32 	%r764, %r497, %r498;

$L__BB0_87:
	and.b32  	%r499, %r130, -2147483648;
	shr.u32 	%r500, %r764, 30;
	shl.b32 	%r501, %r763, 2;
	or.b32  	%r502, %r500, %r501;
	shr.u32 	%r503, %r502, 31;
	shr.u32 	%r504, %r763, 30;
	add.s32 	%r505, %r503, %r504;
	neg.s32 	%r506, %r505;
	setp.eq.s32 	%p84, %r499, 0;
	selp.b32 	%r765, %r505, %r506, %p84;
	setp.ne.s32 	%p85, %r503, 0;
	xor.b32  	%r507, %r499, -2147483648;
	selp.b32 	%r508, %r507, %r499, %p85;
	selp.b32 	%r509, -1, 0, %p85;
	xor.b32  	%r510, %r502, %r509;
	shl.b32 	%r511, %r764, 2;
	xor.b32  	%r512, %r511, %r509;
	cvt.u64.u32 	%rd133, %r510;
	cvt.u64.u32 	%rd134, %r512;
	bfi.b64 	%rd135, %rd133, %rd134, 32, 32;
	cvt.rn.f64.s64 	%fd11, %rd135;
	mul.f64 	%fd12, %fd11, 0d3BF921FB54442D19;
	cvt.rn.f32.f64 	%f746, %fd12;
	setp.eq.s32 	%p86, %r508, 0;
	neg.f32 	%f747, %f746;
	selp.f32 	%f1398, %f746, %f747, %p86;

$L__BB0_89:
	mul.f32 	%f188, %f171, %f1397;
	and.b32  	%r146, %r765, 1;
	setp.eq.s32 	%p87, %r146, 0;
	selp.f32 	%f189, %f1398, 0f3F800000, %p87;
	mul.rn.f32 	%f190, %f1398, %f1398;
	mov.f32 	%f1399, 0fB94D4153;
	@%p87 bra 	$L__BB0_91;

	mov.f32 	%f750, 0fBAB607ED;
	mov.f32 	%f751, 0f37CBAC00;
	fma.rn.f32 	%f1399, %f751, %f190, %f750;

$L__BB0_91:
	selp.f32 	%f752, 0f3C0885E4, 0f3D2AAABB, %p87;
	fma.rn.f32 	%f753, %f1399, %f190, %f752;
	selp.f32 	%f754, 0fBE2AAAA8, 0fBEFFFFFF, %p87;
	fma.rn.f32 	%f755, %f753, %f190, %f754;
	mov.f32 	%f756, 0f00000000;
	fma.rn.f32 	%f757, %f190, %f189, %f756;
	fma.rn.f32 	%f1400, %f755, %f757, %f189;
	and.b32  	%r514, %r765, 2;
	setp.eq.s32 	%p89, %r514, 0;
	@%p89 bra 	$L__BB0_93;

	mov.f32 	%f759, 0fBF800000;
	fma.rn.f32 	%f1400, %f1400, %f759, %f756;

$L__BB0_93:
	mul.f32 	%f769, %f188, %f188;
	mov.f32 	%f770, 0f3F800000;
	sub.f32 	%f771, %f770, %f769;
	mul.f32 	%f772, %f171, %f1400;
	mul.f32 	%f773, %f772, %f772;
	sub.f32 	%f774, %f771, %f773;
	max.f32 	%f775, %f756, %f774;
	sqrt.rn.f32 	%f776, %f775;
	mul.f32 	%f777, %f168, %f772;
	mul.f32 	%f778, %f169, %f772;
	mul.f32 	%f779, %f170, %f772;
	mul.f32 	%f780, %f155, %f170;
	mul.f32 	%f781, %f156, %f169;
	sub.f32 	%f782, %f781, %f780;
	fma.rn.f32 	%f783, %f782, %f188, %f777;
	mul.f32 	%f784, %f156, %f168;
	mul.f32 	%f785, %f154, %f170;
	sub.f32 	%f786, %f785, %f784;
	fma.rn.f32 	%f787, %f786, %f188, %f778;
	mul.f32 	%f788, %f154, %f169;
	mul.f32 	%f789, %f155, %f168;
	sub.f32 	%f790, %f789, %f788;
	fma.rn.f32 	%f791, %f790, %f188, %f779;
	fma.rn.f32 	%f792, %f154, %f776, %f783;
	fma.rn.f32 	%f793, %f155, %f776, %f787;
	fma.rn.f32 	%f794, %f156, %f776, %f791;
	add.f32 	%f795, %f154, %f792;
	add.f32 	%f796, %f155, %f793;
	add.f32 	%f797, %f156, %f794;
	mul.f32 	%f798, %f537, %f795;
	mul.f32 	%f799, %f537, %f796;
	mul.f32 	%f800, %f537, %f797;
	sub.f32 	%f801, %f798, %f154;
	sub.f32 	%f802, %f799, %f155;
	sub.f32 	%f803, %f800, %f156;
	mul.f32 	%f804, %f802, %f802;
	fma.rn.f32 	%f805, %f801, %f801, %f804;
	fma.rn.f32 	%f806, %f803, %f803, %f805;
	sqrt.rn.f32 	%f807, %f806;
	rcp.rn.f32 	%f808, %f807;
	mul.f32 	%f763, %f808, %f801;
	mul.f32 	%f764, %f808, %f802;
	mul.f32 	%f765, %f808, %f803;
	mul.f32 	%f809, %f70, 0f3456BF95;
	abs.f32 	%f810, %f809;
	mul.f32 	%f811, %f71, 0f3456BF95;
	abs.f32 	%f812, %f811;
	mul.f32 	%f813, %f72, 0f3456BF95;
	abs.f32 	%f814, %f813;
	max.f32 	%f815, %f810, %f812;
	max.f32 	%f816, %f815, %f814;
	mov.f32 	%f817, 0f38D1B717;
	max.f32 	%f766, %f816, %f817;
	ld.const.u64 	%rd136, [params+64];
	mov.f32 	%f767, 0f6C4ECB8F;
	mov.u32 	%r551, 2;
	mov.u32 	%r553, 1;
	mov.u32 	%r554, 1065353216;
	mov.u32 	%r585, 0;
	// begin inline asm
	call(%r515,%r516,%r517,%r518,%r519,%r520,%r521,%r522,%r523,%r524,%r525,%r526,%r527,%r528,%r529,%r530,%r531,%r532,%r533,%r534,%r535,%r536,%r537,%r538,%r539,%r540,%r541,%r542,%r543,%r544,%r545,%r546),_optix_trace_typed_32,(%r585,%rd136,%f70,%f71,%f72,%f763,%f764,%f765,%f766,%f767,%f756,%r553,%r585,%r553,%r551,%r553,%r553,%r554,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585,%r585);
	// end inline asm
	mov.b32 	%f1401, %r515;

$L__BB0_94:
	mul.f32 	%f818, %f533, 0f42C80000;
	mul.f32 	%f819, %f159, %f1401;
	mul.f32 	%f820, %f818, %f819;
	setp.gt.s32 	%p90, %r5, 0;
	selp.f32 	%f821, %f820, %f819, %p90;
	mul.f32 	%f822, %f538, %f1391;
	mul.f32 	%f823, %f539, %f1392;
	mul.f32 	%f824, %f540, %f1393;
	mul.f32 	%f1404, %f824, %f821;
	mul.f32 	%f1403, %f823, %f821;
	mul.f32 	%f1402, %f822, %f821;

$L__BB0_95:
	mul.f32 	%f1429, %f1402, %f91;
	mul.f32 	%f1430, %f1403, %f91;
	mul.f32 	%f1431, %f1404, %f91;

$L__BB0_96:
	// Gate on the 32-bit value at params+204: when it is zero, jump
	// straight to $L__BB0_126 with %rs16 cleared.
	ld.const.u32 	%r586, [params+204];
	setp.eq.s32 	%p91, %r586, 0;
	mov.u16 	%rs16, 0;
	@%p91 bra 	$L__BB0_126;

	// Offset (%f70, %f71, %f72) by the three floats at params+308..316
	// and use the result as the direction for a cube-texture fetch.
	ld.const.f32 	%f825, [params+308];
	sub.f32 	%f826, %f70, %f825;
	ld.const.v2.f32 	{%f827, %f828}, [params+312];
	sub.f32 	%f831, %f71, %f827;
	sub.f32 	%f832, %f72, %f828;
	// Integer-valued cube texture whose handle is stored at params+232.
	// The code that follows uses %r147 as a base offset and %r148 as an
	// entry count; %r149 and %r150 are not read within this view.
	ld.const.u64 	%rd137, [params+232];
	tex.cube.v4.u32.f32 	{%r147, %r148, %r149, %r150}, [%rd137, {%f826, %f831, %f832, %f832}];
	// A zero count means there is nothing to process for this texel.
	setp.eq.s32 	%p92, %r148, 0;
	@%p92 bra 	$L__BB0_126;

	cvt.rn.f32.u32 	%f210, %r148;
	mul.f32 	%f834, %f3, %f210;
	cvt.rzi.u32.f32 	%r587, %f834;
	add.s32 	%r588, %r148, -1;
	min.u32 	%r589, %r587, %r588;
	add.s32 	%r590, %r589, %r147;
	ld.const.u64 	%rd138, [params+240];
	cvta.to.global.u64 	%rd139, %rd138;
	mul.wide.s32 	%rd140, %r590, 4;
	add.s64 	%rd141, %rd139, %rd140;
	ld.const.u64 	%rd142, [params+216];
	cvta.to.global.u64 	%rd143, %rd142;
	ld.global.u32 	%r591, [%rd141];
	mul.wide.u32 	%rd144, %r591, 112;
	add.s64 	%rd145, %rd143, %rd144;
	ld.global.v4.f32 	{%f835, %f836, %f837, %f838}, [%rd145];
	ld.global.v4.f32 	{%f839, %f840, %f841, %f842}, [%rd145+16];
	ld.global.v4.f32 	{%f1415, %f1416, %f1417, %f848}, [%rd145+32];
	ld.global.v4.f32 	{%f849, %f850, %f851, %f1414}, [%rd145+48];
	ld.global.v4.f32 	{%f853, %f854, %f855, %f856}, [%rd145+64];
	ld.global.v4.u32 	{%r592, %r593, %r594, %r595}, [%rd145+80];
	mov.b32 	%f229, %r592;
	mov.b32 	%f230, %r593;
	mov.b32 	%f231, %r594;
	ld.global.u64 	%rd42, [%rd145+96];
	sub.f32 	%f232, %f836, %f70;
	sub.f32 	%f233, %f837, %f71;
	sub.f32 	%f234, %f838, %f72;
	mul.f32 	%f857, %f233, %f233;
	fma.rn.f32 	%f858, %f232, %f232, %f857;
	fma.rn.f32 	%f859, %f234, %f234, %f858;
	sqrt.rn.f32 	%f860, %f859;
	rcp.rn.f32 	%f861, %f860;
	mul.f32 	%f1411, %f232, %f861;
	mul.f32 	%f1412, %f233, %f861;
	mul.f32 	%f1413, %f234, %f861;
	mul.f32 	%f238, %f860, %f840;
	mul.f32 	%f239, %f860, %f842;
	mov.f32 	%f865, 0f40800000;
	abs.f32 	%f241, %f239;
	setp.lt.f32 	%p93, %f241, 0f00800000;
	mul.f32 	%f867, %f241, 0f4B800000;
	selp.f32 	%f868, %f867, %f241, %p93;
	selp.f32 	%f869, 0fC3170000, 0fC2FE0000, %p93;
	mov.b32 	%r599, %f868;
	and.b32  	%r600, %r599, 8388607;
	or.b32  	%r601, %r600, 1065353216;
	mov.b32 	%f870, %r601;
	shr.u32 	%r602, %r599, 23;
	cvt.rn.f32.u32 	%f871, %r602;
	add.f32 	%f872, %f869, %f871;
	setp.gt.f32 	%p94, %f870, 0f3FB504F3;
	mul.f32 	%f873, %f870, 0f3F000000;
	add.f32 	%f874, %f872, 0f3F800000;
	selp.f32 	%f875, %f874, %f872, %p94;
	selp.f32 	%f876, %f873, %f870, %p94;
	add.f32 	%f877, %f876, 0fBF800000;
	add.f32 	%f878, %f876, 0f3F800000;
	rcp.approx.ftz.f32 	%f879, %f878;
	add.f32 	%f880, %f877, %f877;
	mul.f32 	%f881, %f880, %f879;
	mul.f32 	%f882, %f881, %f881;
	mov.f32 	%f883, 0f3C4CAF63;
	mov.f32 	%f884, 0f3B18F0FE;
	fma.rn.f32 	%f885, %f884, %f882, %f883;
	mov.f32 	%f886, 0f3DAAAABD;
	fma.rn.f32 	%f887, %f885, %f882, %f886;
	mul.rn.f32 	%f888, %f887, %f882;
	mul.rn.f32 	%f889, %f888, %f881;
	sub.f32 	%f890, %f877, %f881;
	add.f32 	%f891, %f890, %f890;
	neg.f32 	%f892, %f881;
	fma.rn.f32 	%f893, %f892, %f877, %f891;
	mul.rn.f32 	%f894, %f879, %f893;
	add.f32 	%f895, %f889, %f881;
	sub.f32 	%f896, %f881, %f895;
	add.f32 	%f897, %f889, %f896;
	add.f32 	%f898, %f894, %f897;
	add.f32 	%f899, %f895, %f898;
	sub.f32 	%f900, %f895, %f899;
	add.f32 	%f901, %f898, %f900;
	mov.f32 	%f902, 0f3F317200;
	mul.rn.f32 	%f903, %f875, %f902;
	mov.f32 	%f904, 0f35BFBE8E;
	mul.rn.f32 	%f905, %f875, %f904;
	add.f32 	%f906, %f903, %f899;
	sub.f32 	%f907, %f903, %f906;
	add.f32 	%f908, %f899, %f907;
	add.f32 	%f909, %f901, %f908;
	add.f32 	%f910, %f905, %f909;
	add.f32 	%f911, %f906, %f910;
	sub.f32 	%f912, %f906, %f911;
	add.f32 	%f913, %f910, %f912;
	mul.rn.f32 	%f914, %f865, %f911;
	neg.f32 	%f915, %f914;
	fma.rn.f32 	%f916, %f865, %f911, %f915;
	fma.rn.f32 	%f917, %f865, %f913, %f916;
	mov.f32 	%f918, 0f00000000;
	fma.rn.f32 	%f919, %f918, %f911, %f917;
	add.rn.f32 	%f920, %f914, %f919;
	neg.f32 	%f921, %f920;
	add.rn.f32 	%f922, %f914, %f921;
	add.rn.f32 	%f923, %f922, %f919;
	mov.b32 	%r603, %f920;
	setp.eq.s32 	%p95, %r603, 1118925336;
	add.s32 	%r604, %r603, -1;
	mov.b32 	%f924, %r604;
	add.f32 	%f925, %f923, 0f37000000;
	selp.f32 	%f242, %f925, %f923, %p95;
	selp.f32 	%f926, %f924, %f920, %p95;
	mov.f32 	%f927, 0f3FB8AA3B;
	mul.rn.f32 	%f928, %f926, %f927;
	cvt.rzi.f32.f32 	%f929, %f928;
	abs.f32 	%f930, %f929;
	setp.gt.f32 	%p96, %f930, 0f42FC0000;
	mov.b32 	%r605, %f929;
	and.b32  	%r606, %r605, -2147483648;
	or.b32  	%r607, %r606, 1123811328;
	mov.b32 	%f931, %r607;
	selp.f32 	%f932, %f931, %f929, %p96;
	mov.f32 	%f933, 0fBF317218;
	fma.rn.f32 	%f934, %f932, %f933, %f926;
	mov.f32 	%f935, 0f3102E308;
	fma.rn.f32 	%f936, %f932, %f935, %f934;
	mul.f32 	%f937, %f936, 0f3FB8AA3B;
	add.f32 	%f938, %f932, 0f4B40007F;
	mov.b32 	%r608, %f938;
	shl.b32 	%r609, %r608, 23;
	mov.b32 	%f939, %r609;
	ex2.approx.ftz.f32 	%f940, %f937;
	mul.f32 	%f243, %f940, %f939;
	setp.eq.f32 	%p97, %f243, 0f7F800000;
	mov.f32 	%f1408, 0f7F800000;
	@%p97 bra 	$L__BB0_100;

	fma.rn.f32 	%f1408, %f243, %f242, %f243;

$L__BB0_100:
	mov.f32 	%f1344, 0f40000000;
	cvt.rzi.f32.f32 	%f1343, %f1344;
	add.f32 	%f1342, %f1343, %f1343;
	mov.f32 	%f1341, 0f40800000;
	sub.f32 	%f1340, %f1341, %f1342;
	abs.f32 	%f1339, %f1340;
	setp.lt.f32 	%p98, %f239, 0f00000000;
	setp.eq.f32 	%p99, %f1339, 0f3F800000;
	and.pred  	%p1, %p98, %p99;
	setp.eq.f32 	%p100, %f239, 0f00000000;
	@%p100 bra 	$L__BB0_104;
	bra.uni 	$L__BB0_101;

$L__BB0_104:
	add.f32 	%f945, %f239, %f239;
	selp.f32 	%f1410, %f945, 0f00000000, %p99;
	bra.uni 	$L__BB0_105;

$L__BB0_101:
	mov.b32 	%r610, %f1408;
	xor.b32  	%r611, %r610, -2147483648;
	mov.b32 	%f941, %r611;
	selp.f32 	%f1410, %f941, %f1408, %p1;
	setp.geu.f32 	%p101, %f239, 0f00000000;
	@%p101 bra 	$L__BB0_105;

	mov.f32 	%f942, 0f40800000;
	cvt.rzi.f32.f32 	%f943, %f942;
	setp.eq.f32 	%p102, %f943, 0f40800000;
	@%p102 bra 	$L__BB0_105;

	mov.f32 	%f1410, 0f7FFFFFFF;

$L__BB0_105:
	abs.f32 	%f1345, %f239;
	add.f32 	%f946, %f1345, 0f40800000;
	mov.b32 	%r612, %f946;
	setp.lt.s32 	%p104, %r612, 2139095040;
	@%p104 bra 	$L__BB0_110;

	abs.f32 	%f1349, %f239;
	setp.gtu.f32 	%p105, %f1349, 0f7F800000;
	@%p105 bra 	$L__BB0_109;
	bra.uni 	$L__BB0_107;

$L__BB0_109:
	add.f32 	%f1410, %f239, 0f40800000;
	bra.uni 	$L__BB0_110;

$L__BB0_107:
	abs.f32 	%f1350, %f239;
	setp.neu.f32 	%p106, %f1350, 0f7F800000;
	@%p106 bra 	$L__BB0_110;

	selp.f32 	%f1410, 0fFF800000, 0f7F800000, %p1;

$L__BB0_110:
	mov.f32 	%f947, 0f3F800000;
	sub.f32 	%f948, %f947, %f1410;
	setp.eq.f32 	%p107, %f239, 0f3F800000;
	selp.f32 	%f949, 0f00000000, %f948, %p107;
	cvt.sat.f32.f32 	%f950, %f949;
	fma.rn.f32 	%f951, %f238, %f238, %f841;
	div.rn.f32 	%f1418, %f950, %f951;
	mul.f32 	%f952, %f1364, %f1412;
	fma.rn.f32 	%f953, %f1363, %f1411, %f952;
	fma.rn.f32 	%f253, %f1365, %f1413, %f953;
	setp.eq.f32 	%p108, %f835, 0f3F800000;
	@%p108 bra 	$L__BB0_116;
	bra.uni 	$L__BB0_111;

$L__BB0_116:
	setp.eq.s64 	%p112, %rd42, 0;
	@%p112 bra 	$L__BB0_120;

	mul.f32 	%f976, %f229, %f1411;
	mul.f32 	%f977, %f230, %f1412;
	neg.f32 	%f978, %f977;
	sub.f32 	%f979, %f978, %f976;
	mul.f32 	%f980, %f231, %f1413;
	sub.f32 	%f258, %f979, %f980;
	setp.geu.f32 	%p113, %f1414, 0f00000000;
	@%p113 bra 	$L__BB0_119;

	sub.f32 	%f1348, %f838, %f72;
	sub.f32 	%f1347, %f836, %f70;
	sub.f32 	%f1346, %f837, %f71;
	mul.f32 	%f981, %f230, %f1346;
	fma.rn.f32 	%f982, %f229, %f1347, %f981;
	fma.rn.f32 	%f983, %f231, %f1348, %f982;
	rcp.rn.f32 	%f984, %f983;
	mul.f32 	%f1411, %f1347, %f984;
	mul.f32 	%f1412, %f1346, %f984;
	mul.f32 	%f1413, %f1348, %f984;
	neg.f32 	%f1414, %f1414;

$L__BB0_119:
	setp.gt.f32 	%p114, %f258, 0f00000000;
	selp.f32 	%f985, 0f3F800000, 0f00000000, %p114;
	mov.f32 	%f986, 0f3F800000;
	mul.f32 	%f987, %f850, %f1412;
	fma.rn.f32 	%f988, %f849, %f1411, %f987;
	mul.f32 	%f989, %f854, %f1412;
	fma.rn.f32 	%f990, %f853, %f1411, %f989;
	fma.rn.f32 	%f991, %f851, %f1413, %f988;
	fma.rn.f32 	%f992, %f855, %f1413, %f990;
	fma.rn.f32 	%f993, %f1414, %f991, 0f3F000000;
	sub.f32 	%f994, %f986, %f993;
	fma.rn.f32 	%f995, %f1414, %f992, 0f3F000000;
	tex.2d.v4.f32.f32 	{%f996, %f997, %f998, %f999}, [%rd42, {%f994, %f995}];
	mul.f32 	%f1000, %f985, %f996;
	mul.f32 	%f1001, %f985, %f997;
	mul.f32 	%f1002, %f985, %f998;
	mul.f32 	%f1415, %f1415, %f1000;
	mul.f32 	%f1416, %f1416, %f1001;
	mul.f32 	%f1417, %f1417, %f1002;
	bra.uni 	$L__BB0_120;

$L__BB0_111:
	setp.eq.f32 	%p109, %f835, 0f40000000;
	@%p109 bra 	$L__BB0_114;
	bra.uni 	$L__BB0_112;

$L__BB0_114:
	setp.eq.s64 	%p111, %rd42, 0;
	@%p111 bra 	$L__BB0_120;

	mul.f32 	%f963, %f850, %f1412;
	fma.rn.f32 	%f964, %f849, %f1411, %f963;
	mul.f32 	%f965, %f854, %f1412;
	fma.rn.f32 	%f966, %f853, %f1411, %f965;
	mul.f32 	%f967, %f230, %f1412;
	fma.rn.f32 	%f968, %f229, %f1411, %f967;
	fma.rn.f32 	%f969, %f851, %f1413, %f964;
	fma.rn.f32 	%f970, %f855, %f1413, %f966;
	fma.rn.f32 	%f971, %f231, %f1413, %f968;
	tex.cube.v4.f32.f32 	{%f972, %f973, %f974, %f975}, [%rd42, {%f969, %f970, %f971, %f971}];
	mul.f32 	%f1415, %f1415, %f972;
	mul.f32 	%f1416, %f1416, %f973;
	mul.f32 	%f1417, %f1417, %f974;
	bra.uni 	$L__BB0_120;

$L__BB0_112:
	setp.neu.f32 	%p110, %f835, 0f40800000;
	@%p110 bra 	$L__BB0_120;

	mul.f32 	%f954, %f229, %f1411;
	mul.f32 	%f955, %f230, %f1412;
	neg.f32 	%f956, %f955;
	sub.f32 	%f957, %f956, %f954;
	mul.f32 	%f958, %f231, %f1413;
	sub.f32 	%f959, %f957, %f958;
	fma.rn.f32 	%f960, %f848, %f959, %f1414;
	cvt.sat.f32.f32 	%f961, %f960;
	mul.f32 	%f962, %f961, %f961;
	mul.f32 	%f1418, %f1418, %f962;

$L__BB0_120:
	max.f32 	%f1006, %f1415, %f1416;
	max.f32 	%f1007, %f1006, %f1417;
	cvt.sat.f32.f32 	%f1008, %f253;
	mul.f32 	%f274, %f1008, %f1418;
	mul.f32 	%f1009, %f274, %f1007;
	setp.lt.f32 	%p115, %f1009, 0f3727C5AC;
	mov.f32 	%f1420, 0f00000000;
	mov.f32 	%f1421, %f1420;
	mov.f32 	%f1422, %f1420;
	@%p115 bra 	$L__BB0_124;

	setp.lt.s32 	%p116, %r595, 1;
	mov.f32 	%f1419, 0f3F800000;
	@%p116 bra 	$L__BB0_123;

	fma.rn.f32 	%f1020, %f1, 0f40000000, 0fBF800000;
	fma.rn.f32 	%f1021, %f2, 0f40000000, 0fBF800000;
	fma.rn.f32 	%f1022, %f3, 0f40000000, 0fBF800000;
	fma.rn.f32 	%f1023, %f1020, %f839, %f836;
	fma.rn.f32 	%f1024, %f1021, %f839, %f837;
	fma.rn.f32 	%f1025, %f1022, %f839, %f838;
	sub.f32 	%f1026, %f1023, %f70;
	sub.f32 	%f1027, %f1024, %f71;
	sub.f32 	%f1028, %f1025, %f72;
	mul.f32 	%f1029, %f1027, %f1027;
	fma.rn.f32 	%f1030, %f1026, %f1026, %f1029;
	fma.rn.f32 	%f1031, %f1028, %f1028, %f1030;
	sqrt.rn.f32 	%f1018, %f1031;
	rcp.rn.f32 	%f1032, %f1018;
	mul.f32 	%f1014, %f1026, %f1032;
	mul.f32 	%f1015, %f1027, %f1032;
	mul.f32 	%f1016, %f1028, %f1032;
	mul.f32 	%f1033, %f70, 0f3456BF95;
	abs.f32 	%f1034, %f1033;
	mul.f32 	%f1035, %f71, 0f3456BF95;
	abs.f32 	%f1036, %f1035;
	mul.f32 	%f1037, %f72, 0f3456BF95;
	abs.f32 	%f1038, %f1037;
	max.f32 	%f1039, %f1034, %f1036;
	max.f32 	%f1040, %f1039, %f1038;
	mov.f32 	%f1041, 0f38D1B717;
	max.f32 	%f1017, %f1040, %f1041;
	ld.const.u64 	%rd146, [params+64];
	mov.f32 	%f1019, 0f00000000;
	mov.u32 	%r649, 2;
	mov.u32 	%r651, 1;
	mov.u32 	%r652, 1065353216;
	mov.u32 	%r683, 0;
	// begin inline asm
	call(%r613,%r614,%r615,%r616,%r617,%r618,%r619,%r620,%r621,%r622,%r623,%r624,%r625,%r626,%r627,%r628,%r629,%r630,%r631,%r632,%r633,%r634,%r635,%r636,%r637,%r638,%r639,%r640,%r641,%r642,%r643,%r644),_optix_trace_typed_32,(%r683,%rd146,%f70,%f71,%f72,%f1014,%f1015,%f1016,%f1017,%f1018,%f1019,%r651,%r683,%r651,%r649,%r651,%r651,%r652,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683,%r683);
	// end inline asm
	mov.b32 	%f1419, %r613;

$L__BB0_123:
	ld.const.u32 	%r740, [params+340];
	mul.f32 	%f1042, %f274, %f1419;
	mul.f32 	%f1043, %f856, %f1042;
	setp.gt.s32 	%p117, %r740, 0;
	selp.f32 	%f1044, %f1043, %f1042, %p117;
	mul.f32 	%f1422, %f1417, %f1044;
	mul.f32 	%f1421, %f1416, %f1044;
	mul.f32 	%f1420, %f1415, %f1044;

$L__BB0_124:
	mov.u16 	%rs16, 0;
	fma.rn.f32 	%f1429, %f1420, %f210, %f1429;
	fma.rn.f32 	%f1430, %f1421, %f210, %f1430;
	fma.rn.f32 	%f1431, %f1422, %f210, %f1431;

$L__BB0_126:
	// %p176 = (32-bit value at params+340 == 0); it selects the
	// non-accumulating path at $L__BB0_128 further down.
	ld.const.u32 	%r741, [params+340];
	setp.eq.s32 	%p176, %r741, 0;
	// Scrub NaNs from (%f1429, %f1430, %f1431): the ordered compare
	// |v| <= +Inf is false only for NaN, so NaN components become 0
	// while infinities pass through unchanged.
	abs.f32 	%f1054, %f1429;
	setp.le.f32 	%p119, %f1054, 0f7F800000;
	selp.f32 	%f1055, %f1429, 0f00000000, %p119;
	abs.f32 	%f1056, %f1430;
	setp.le.f32 	%p120, %f1056, 0f7F800000;
	selp.f32 	%f1057, %f1430, 0f00000000, %p120;
	abs.f32 	%f1058, %f1431;
	setp.le.f32 	%p121, %f1058, 0f7F800000;
	selp.f32 	%f1059, %f1431, 0f00000000, %p121;
	// Per-component combine: out = %f1426..8 * scrubbed + %f1423..5.
	fma.rn.f32 	%f1435, %f1426, %f1055, %f1423;
	fma.rn.f32 	%f1436, %f1427, %f1057, %f1424;
	fma.rn.f32 	%f1437, %f1428, %f1059, %f1425;
	// Write the three multipliers back to the 12-byte slot at %rd15
	// (%rd15 is computed outside this view).
	st.global.f32 	[%rd15], %f1426;
	st.global.f32 	[%rd15+4], %f1427;
	st.global.f32 	[%rd15+8], %f1428;
	// %rd43 = buffer at params+96, element (stride at params+88) *
	// launch_index_y + launch_index_x, 12 bytes per element.
	ld.const.u64 	%rd147, [params+96];
	cvta.to.global.u64 	%rd148, %rd147;
	ld.const.u32 	%r684, [params+88];
	mad.lo.s32 	%r685, %r684, %r156, %r155;
	mul.wide.u32 	%rd149, %r685, 12;
	add.s64 	%rd43, %rd148, %rd149;
	@%p176 bra 	$L__BB0_128;

	// params+340 != 0: add the value already stored at %rd43 to the
	// new result before it is written back at $L__BB0_133.
	ld.global.f32 	%f1060, [%rd43];
	add.f32 	%f1435, %f1435, %f1060;
	ld.global.f32 	%f1061, [%rd43+4];
	add.f32 	%f1436, %f1436, %f1061;
	ld.global.f32 	%f1062, [%rd43+8];
	add.f32 	%f1437, %f1437, %f1062;
	bra.uni 	$L__BB0_133;

$L__BB0_128:
	// Reached when params+340 == 0. Keep the computed result unless
	// %rs16 is non-zero AND the signed index at params+368 is >= 0.
	setp.eq.s16 	%p123, %rs16, 0;
	ld.const.u32 	%r153, [params+368];
	setp.lt.s32 	%p124, %r153, 0;
	or.pred  	%p125, %p123, %p124;
	@%p125 bra 	$L__BB0_133;

	// Index a table of 64-byte records at params+208 with %r153; read
	// four floats at record offset 16 and a 64-bit handle at offset 48.
	ld.const.u64 	%rd150, [params+208];
	cvta.to.global.u64 	%rd151, %rd150;
	mul.wide.s32 	%rd152, %r153, 64;
	add.s64 	%rd153, %rd151, %rd152;
	ld.global.v4.f32 	{%f1063, %f1064, %f1065, %f1066}, [%rd153+16];
	ld.global.u64 	%rd44, [%rd153+48];
	// Keep the computed result when %f1063 is non-zero (or NaN) and
	// %f1358 is <= 0 (or NaN); both compares are the unordered forms.
	setp.neu.f32 	%p126, %f1063, 0f00000000;
	setp.leu.f32 	%p127, %f1358, 0f00000000;
	and.pred  	%p128, %p127, %p126;
	@%p128 bra 	$L__BB0_133;

	// Default the three factors to 1.0; a null handle skips the fetch.
	setp.eq.s64 	%p129, %rd44, 0;
	mov.f32 	%f1432, 0f3F800000;
	mov.f32 	%f1433, %f1432;
	mov.f32 	%f1434, %f1432;
	@%p129 bra 	$L__BB0_132;

	// Cube-texture fetch with direction (-%f1359, -%f1358, -%f1357);
	// the fourth returned component (%f1073) is not used in this view.
	neg.f32 	%f1070, %f1359;
	neg.f32 	%f1071, %f1357;
	neg.f32 	%f1072, %f1358;
	tex.cube.v4.f32.f32 	{%f1434, %f1433, %f1432, %f1073}, [%rd44, {%f1070, %f1072, %f1071, %f1071}];

$L__BB0_132:
	// Replace the result with record floats 1..3 times the factors.
	mul.f32 	%f1435, %f1064, %f1434;
	mul.f32 	%f1436, %f1065, %f1433;
	mul.f32 	%f1437, %f1066, %f1432;

$L__BB0_133:
	// Commit the three result components to the 12-byte slot at %rd43.
	st.global.f32 	[%rd43], %f1435;
	st.global.f32 	[%rd43+4], %f1436;
	st.global.f32 	[%rd43+8], %f1437;
	// %rd45 = buffer at params+112, element (stride at params+104) *
	// launch_index_y + launch_index_x, 12 bytes per element.
	ld.const.u64 	%rd154, [params+112];
	cvta.to.global.u64 	%rd155, %rd154;
	ld.const.u32 	%r686, [params+104];
	mad.lo.s32 	%r687, %r686, %r156, %r155;
	mul.wide.u32 	%rd156, %r687, 12;
	add.s64 	%rd45, %rd155, %rd156;
	// params+344 holds a pair: %r688 is a write-back flag and %r689 is
	// reinterpreted as the f32 blend weight %f1074.
	ld.const.v2.u32 	{%r688, %r689}, [params+344];
	mov.b32 	%f1074, %r689;
	// Blend toward the new result:
	// out = previous + (new - previous) * weight.
	ld.global.f32 	%f1075, [%rd45];
	sub.f32 	%f1076, %f1435, %f1075;
	ld.global.f32 	%f1077, [%rd45+4];
	sub.f32 	%f1078, %f1436, %f1077;
	ld.global.f32 	%f1079, [%rd45+8];
	sub.f32 	%f1080, %f1437, %f1079;
	fma.rn.f32 	%f317, %f1076, %f1074, %f1075;
	fma.rn.f32 	%f318, %f1078, %f1074, %f1077;
	fma.rn.f32 	%f319, %f1080, %f1074, %f1079;
	// The blended value is written back only when the flag is non-zero;
	// either way %f317..%f319 are used by the code that follows.
	setp.eq.s32 	%p130, %r688, 0;
	@%p130 bra 	$L__BB0_135;

	st.global.f32 	[%rd45], %f317;
	st.global.f32 	[%rd45+4], %f318;
	st.global.f32 	[%rd45+8], %f319;

$L__BB0_135:
	not.b32 	%r692, %r156;
	add.s32 	%r154, %r159, %r692;
	ld.const.f32 	%f1082, [params+324];
	mul.f32 	%f320, %f317, %f1082;
	mul.f32 	%f321, %f318, %f1082;
	mul.f32 	%f322, %f319, %f1082;
	mov.f32 	%f1083, 0f3E68BA2E;
	cvt.rzi.f32.f32 	%f1084, %f1083;
	add.f32 	%f1085, %f1084, %f1084;
	mov.f32 	%f1086, 0f3EE8BA2E;
	sub.f32 	%f1087, %f1086, %f1085;
	abs.f32 	%f323, %f1087;
	abs.f32 	%f324, %f320;
	setp.lt.f32 	%p131, %f324, 0f00800000;
	mul.f32 	%f1088, %f324, 0f4B800000;
	selp.f32 	%f1089, %f1088, %f324, %p131;
	selp.f32 	%f1090, 0fC3170000, 0fC2FE0000, %p131;
	mov.b32 	%r693, %f1089;
	and.b32  	%r694, %r693, 8388607;
	or.b32  	%r695, %r694, 1065353216;
	mov.b32 	%f1091, %r695;
	shr.u32 	%r696, %r693, 23;
	cvt.rn.f32.u32 	%f1092, %r696;
	add.f32 	%f1093, %f1090, %f1092;
	setp.gt.f32 	%p132, %f1091, 0f3FB504F3;
	mul.f32 	%f1094, %f1091, 0f3F000000;
	add.f32 	%f1095, %f1093, 0f3F800000;
	selp.f32 	%f1096, %f1095, %f1093, %p132;
	selp.f32 	%f1097, %f1094, %f1091, %p132;
	add.f32 	%f1098, %f1097, 0fBF800000;
	add.f32 	%f1099, %f1097, 0f3F800000;
	rcp.approx.ftz.f32 	%f1100, %f1099;
	add.f32 	%f1101, %f1098, %f1098;
	mul.f32 	%f1102, %f1101, %f1100;
	mul.f32 	%f1103, %f1102, %f1102;
	mov.f32 	%f1104, 0f3C4CAF63;
	mov.f32 	%f1105, 0f3B18F0FE;
	fma.rn.f32 	%f1106, %f1105, %f1103, %f1104;
	mov.f32 	%f1107, 0f3DAAAABD;
	fma.rn.f32 	%f1108, %f1106, %f1103, %f1107;
	mul.rn.f32 	%f1109, %f1108, %f1103;
	mul.rn.f32 	%f1110, %f1109, %f1102;
	sub.f32 	%f1111, %f1098, %f1102;
	add.f32 	%f1112, %f1111, %f1111;
	neg.f32 	%f1113, %f1102;
	fma.rn.f32 	%f1114, %f1113, %f1098, %f1112;
	mul.rn.f32 	%f1115, %f1100, %f1114;
	add.f32 	%f1116, %f1110, %f1102;
	sub.f32 	%f1117, %f1102, %f1116;
	add.f32 	%f1118, %f1110, %f1117;
	add.f32 	%f1119, %f1115, %f1118;
	add.f32 	%f1120, %f1116, %f1119;
	sub.f32 	%f1121, %f1116, %f1120;
	add.f32 	%f1122, %f1119, %f1121;
	mov.f32 	%f1123, 0f3F317200;
	mul.rn.f32 	%f1124, %f1096, %f1123;
	mov.f32 	%f1125, 0f35BFBE8E;
	mul.rn.f32 	%f1126, %f1096, %f1125;
	add.f32 	%f1127, %f1124, %f1120;
	sub.f32 	%f1128, %f1124, %f1127;
	add.f32 	%f1129, %f1120, %f1128;
	add.f32 	%f1130, %f1122, %f1129;
	add.f32 	%f1131, %f1126, %f1130;
	add.f32 	%f1132, %f1127, %f1131;
	sub.f32 	%f1133, %f1127, %f1132;
	add.f32 	%f1134, %f1131, %f1133;
	mul.rn.f32 	%f1135, %f1086, %f1132;
	neg.f32 	%f1136, %f1135;
	fma.rn.f32 	%f1137, %f1086, %f1132, %f1136;
	fma.rn.f32 	%f1138, %f1086, %f1134, %f1137;
	mov.f32 	%f1139, 0f00000000;
	fma.rn.f32 	%f1140, %f1139, %f1132, %f1138;
	add.rn.f32 	%f1141, %f1135, %f1140;
	neg.f32 	%f1142, %f1141;
	add.rn.f32 	%f1143, %f1135, %f1142;
	add.rn.f32 	%f1144, %f1143, %f1140;
	mov.b32 	%r697, %f1141;
	setp.eq.s32 	%p133, %r697, 1118925336;
	add.s32 	%r698, %r697, -1;
	mov.b32 	%f1145, %r698;
	add.f32 	%f1146, %f1144, 0f37000000;
	selp.f32 	%f325, %f1146, %f1144, %p133;
	selp.f32 	%f1147, %f1145, %f1141, %p133;
	mov.f32 	%f1148, 0f3FB8AA3B;
	mul.rn.f32 	%f1149, %f1147, %f1148;
	cvt.rzi.f32.f32 	%f1150, %f1149;
	abs.f32 	%f1151, %f1150;
	setp.gt.f32 	%p134, %f1151, 0f42FC0000;
	mov.b32 	%r699, %f1150;
	and.b32  	%r700, %r699, -2147483648;
	or.b32  	%r701, %r700, 1123811328;
	mov.b32 	%f1152, %r701;
	selp.f32 	%f1153, %f1152, %f1150, %p134;
	mov.f32 	%f1154, 0fBF317218;
	fma.rn.f32 	%f1155, %f1153, %f1154, %f1147;
	mov.f32 	%f1156, 0f3102E308;
	fma.rn.f32 	%f1157, %f1153, %f1156, %f1155;
	mul.f32 	%f1158, %f1157, 0f3FB8AA3B;
	add.f32 	%f1159, %f1153, 0f4B40007F;
	mov.b32 	%r702, %f1159;
	shl.b32 	%r703, %r702, 23;
	mov.b32 	%f1160, %r703;
	ex2.approx.ftz.f32 	%f1161, %f1158;
	mul.f32 	%f326, %f1161, %f1160;
	setp.eq.f32 	%p135, %f326, 0f7F800000;
	mov.f32 	%f1438, 0f7F800000;
	@%p135 bra 	$L__BB0_137;

	fma.rn.f32 	%f1438, %f326, %f325, %f326;

$L__BB0_137:
	setp.lt.f32 	%p136, %f320, 0f00000000;
	setp.eq.f32 	%p137, %f323, 0f3F800000;
	and.pred  	%p2, %p136, %p137;
	setp.eq.f32 	%p138, %f320, 0f00000000;
	@%p138 bra 	$L__BB0_141;
	bra.uni 	$L__BB0_138;

$L__BB0_141:
	add.f32 	%f1166, %f320, %f320;
	selp.f32 	%f1440, %f1166, 0f00000000, %p137;
	bra.uni 	$L__BB0_142;

$L__BB0_138:
	mov.b32 	%r704, %f1438;
	xor.b32  	%r705, %r704, -2147483648;
	mov.b32 	%f1162, %r705;
	selp.f32 	%f1440, %f1162, %f1438, %p2;
	setp.geu.f32 	%p139, %f320, 0f00000000;
	@%p139 bra 	$L__BB0_142;

	mov.f32 	%f1163, 0f3EE8BA2E;
	cvt.rzi.f32.f32 	%f1164, %f1163;
	setp.eq.f32 	%p140, %f1164, 0f3EE8BA2E;
	@%p140 bra 	$L__BB0_142;

	mov.f32 	%f1440, 0f7FFFFFFF;

$L__BB0_142:
	add.f32 	%f1167, %f324, 0f3EE8BA2E;
	mov.b32 	%r706, %f1167;
	setp.lt.s32 	%p142, %r706, 2139095040;
	@%p142 bra 	$L__BB0_147;

	setp.gtu.f32 	%p143, %f324, 0f7F800000;
	@%p143 bra 	$L__BB0_146;
	bra.uni 	$L__BB0_144;

$L__BB0_146:
	add.f32 	%f1440, %f320, 0f3EE8BA2E;
	bra.uni 	$L__BB0_147;

$L__BB0_144:
	setp.neu.f32 	%p144, %f324, 0f7F800000;
	@%p144 bra 	$L__BB0_147;

	selp.f32 	%f1440, 0fFF800000, 0f7F800000, %p2;

$L__BB0_147:
	setp.eq.f32 	%p145, %f320, 0f3F800000;
	selp.f32 	%f1169, 0f3F800000, %f1440, %p145;
	cvt.sat.f32.f32 	%f335, %f1169;
	abs.f32 	%f336, %f321;
	setp.lt.f32 	%p146, %f336, 0f00800000;
	mul.f32 	%f1170, %f336, 0f4B800000;
	selp.f32 	%f1171, %f1170, %f336, %p146;
	selp.f32 	%f1172, 0fC3170000, 0fC2FE0000, %p146;
	mov.b32 	%r707, %f1171;
	and.b32  	%r708, %r707, 8388607;
	or.b32  	%r709, %r708, 1065353216;
	mov.b32 	%f1173, %r709;
	shr.u32 	%r710, %r707, 23;
	cvt.rn.f32.u32 	%f1174, %r710;
	add.f32 	%f1175, %f1172, %f1174;
	setp.gt.f32 	%p147, %f1173, 0f3FB504F3;
	mul.f32 	%f1176, %f1173, 0f3F000000;
	add.f32 	%f1177, %f1175, 0f3F800000;
	selp.f32 	%f1178, %f1177, %f1175, %p147;
	selp.f32 	%f1179, %f1176, %f1173, %p147;
	add.f32 	%f1180, %f1179, 0fBF800000;
	add.f32 	%f1181, %f1179, 0f3F800000;
	rcp.approx.ftz.f32 	%f1182, %f1181;
	add.f32 	%f1183, %f1180, %f1180;
	mul.f32 	%f1184, %f1183, %f1182;
	mul.f32 	%f1185, %f1184, %f1184;
	mov.f32 	%f1186, 0f3C4CAF63;
	mov.f32 	%f1187, 0f3B18F0FE;
	fma.rn.f32 	%f1188, %f1187, %f1185, %f1186;
	mov.f32 	%f1189, 0f3DAAAABD;
	fma.rn.f32 	%f1190, %f1188, %f1185, %f1189;
	mul.rn.f32 	%f1191, %f1190, %f1185;
	mul.rn.f32 	%f1192, %f1191, %f1184;
	sub.f32 	%f1193, %f1180, %f1184;
	add.f32 	%f1194, %f1193, %f1193;
	neg.f32 	%f1195, %f1184;
	fma.rn.f32 	%f1196, %f1195, %f1180, %f1194;
	mul.rn.f32 	%f1197, %f1182, %f1196;
	add.f32 	%f1198, %f1192, %f1184;
	sub.f32 	%f1199, %f1184, %f1198;
	add.f32 	%f1200, %f1192, %f1199;
	add.f32 	%f1201, %f1197, %f1200;
	add.f32 	%f1202, %f1198, %f1201;
	sub.f32 	%f1203, %f1198, %f1202;
	add.f32 	%f1204, %f1201, %f1203;
	mov.f32 	%f1205, 0f3F317200;
	mul.rn.f32 	%f1206, %f1178, %f1205;
	mov.f32 	%f1207, 0f35BFBE8E;
	mul.rn.f32 	%f1208, %f1178, %f1207;
	add.f32 	%f1209, %f1206, %f1202;
	sub.f32 	%f1210, %f1206, %f1209;
	add.f32 	%f1211, %f1202, %f1210;
	add.f32 	%f1212, %f1204, %f1211;
	add.f32 	%f1213, %f1208, %f1212;
	add.f32 	%f1214, %f1209, %f1213;
	sub.f32 	%f1215, %f1209, %f1214;
	add.f32 	%f1216, %f1213, %f1215;
	mov.f32 	%f1217, 0f3EE8BA2E;
	mul.rn.f32 	%f1218, %f1217, %f1214;
	neg.f32 	%f1219, %f1218;
	fma.rn.f32 	%f1220, %f1217, %f1214, %f1219;
	fma.rn.f32 	%f1221, %f1217, %f1216, %f1220;
	mov.f32 	%f1222, 0f00000000;
	fma.rn.f32 	%f1223, %f1222, %f1214, %f1221;
	add.rn.f32 	%f1224, %f1218, %f1223;
	neg.f32 	%f1225, %f1224;
	add.rn.f32 	%f1226, %f1218, %f1225;
	add.rn.f32 	%f1227, %f1226, %f1223;
	mov.b32 	%r711, %f1224;
	setp.eq.s32 	%p148, %r711, 1118925336;
	add.s32 	%r712, %r711, -1;
	mov.b32 	%f1228, %r712;
	add.f32 	%f1229, %f1227, 0f37000000;
	selp.f32 	%f337, %f1229, %f1227, %p148;
	selp.f32 	%f1230, %f1228, %f1224, %p148;
	mov.f32 	%f1231, 0f3FB8AA3B;
	mul.rn.f32 	%f1232, %f1230, %f1231;
	cvt.rzi.f32.f32 	%f1233, %f1232;
	abs.f32 	%f1234, %f1233;
	setp.gt.f32 	%p149, %f1234, 0f42FC0000;
	mov.b32 	%r713, %f1233;
	and.b32  	%r714, %r713, -2147483648;
	or.b32  	%r715, %r714, 1123811328;
	mov.b32 	%f1235, %r715;
	selp.f32 	%f1236, %f1235, %f1233, %p149;
	mov.f32 	%f1237, 0fBF317218;
	fma.rn.f32 	%f1238, %f1236, %f1237, %f1230;
	mov.f32 	%f1239, 0f3102E308;
	fma.rn.f32 	%f1240, %f1236, %f1239, %f1238;
	mul.f32 	%f1241, %f1240, 0f3FB8AA3B;
	add.f32 	%f1242, %f1236, 0f4B40007F;
	mov.b32 	%r716, %f1242;
	shl.b32 	%r717, %r716, 23;
	mov.b32 	%f1243, %r717;
	ex2.approx.ftz.f32 	%f1244, %f1241;
	mul.f32 	%f338, %f1244, %f1243;
	setp.eq.f32 	%p150, %f338, 0f7F800000;
	mov.f32 	%f1441, 0f7F800000;
	@%p150 bra 	$L__BB0_149;

	fma.rn.f32 	%f1441, %f338, %f337, %f338;

$L__BB0_149:
	setp.lt.f32 	%p151, %f321, 0f00000000;
	and.pred  	%p3, %p151, %p137;
	setp.eq.f32 	%p153, %f321, 0f00000000;
	@%p153 bra 	$L__BB0_153;
	bra.uni 	$L__BB0_150;

$L__BB0_153:
	add.f32 	%f1249, %f321, %f321;
	selp.f32 	%f1443, %f1249, 0f00000000, %p137;
	bra.uni 	$L__BB0_154;

$L__BB0_150:
	mov.b32 	%r718, %f1441;
	xor.b32  	%r719, %r718, -2147483648;
	mov.b32 	%f1245, %r719;
	selp.f32 	%f1443, %f1245, %f1441, %p3;
	setp.geu.f32 	%p154, %f321, 0f00000000;
	@%p154 bra 	$L__BB0_154;

	mov.f32 	%f1246, 0f3EE8BA2E;
	cvt.rzi.f32.f32 	%f1247, %f1246;
	setp.eq.f32 	%p155, %f1247, 0f3EE8BA2E;
	@%p155 bra 	$L__BB0_154;

	mov.f32 	%f1443, 0f7FFFFFFF;

$L__BB0_154:
	add.f32 	%f1250, %f336, 0f3EE8BA2E;
	mov.b32 	%r720, %f1250;
	setp.lt.s32 	%p157, %r720, 2139095040;
	@%p157 bra 	$L__BB0_159;

	setp.gtu.f32 	%p158, %f336, 0f7F800000;
	@%p158 bra 	$L__BB0_158;
	bra.uni 	$L__BB0_156;

$L__BB0_158:
	add.f32 	%f1443, %f321, 0f3EE8BA2E;
	bra.uni 	$L__BB0_159;

$L__BB0_156:
	setp.neu.f32 	%p159, %f336, 0f7F800000;
	@%p159 bra 	$L__BB0_159;

	selp.f32 	%f1443, 0fFF800000, 0f7F800000, %p3;

$L__BB0_159:
	setp.eq.f32 	%p160, %f321, 0f3F800000;
	selp.f32 	%f1252, 0f3F800000, %f1443, %p160;
	cvt.sat.f32.f32 	%f347, %f1252;
	abs.f32 	%f348, %f322;
	setp.lt.f32 	%p161, %f348, 0f00800000;
	mul.f32 	%f1253, %f348, 0f4B800000;
	selp.f32 	%f1254, %f1253, %f348, %p161;
	selp.f32 	%f1255, 0fC3170000, 0fC2FE0000, %p161;
	mov.b32 	%r721, %f1254;
	and.b32  	%r722, %r721, 8388607;
	or.b32  	%r723, %r722, 1065353216;
	mov.b32 	%f1256, %r723;
	shr.u32 	%r724, %r721, 23;
	cvt.rn.f32.u32 	%f1257, %r724;
	add.f32 	%f1258, %f1255, %f1257;
	setp.gt.f32 	%p162, %f1256, 0f3FB504F3;
	mul.f32 	%f1259, %f1256, 0f3F000000;
	add.f32 	%f1260, %f1258, 0f3F800000;
	selp.f32 	%f1261, %f1260, %f1258, %p162;
	selp.f32 	%f1262, %f1259, %f1256, %p162;
	add.f32 	%f1263, %f1262, 0fBF800000;
	add.f32 	%f1264, %f1262, 0f3F800000;
	rcp.approx.ftz.f32 	%f1265, %f1264;
	add.f32 	%f1266, %f1263, %f1263;
	mul.f32 	%f1267, %f1266, %f1265;
	mul.f32 	%f1268, %f1267, %f1267;
	mov.f32 	%f1269, 0f3C4CAF63;
	mov.f32 	%f1270, 0f3B18F0FE;
	fma.rn.f32 	%f1271, %f1270, %f1268, %f1269;
	mov.f32 	%f1272, 0f3DAAAABD;
	fma.rn.f32 	%f1273, %f1271, %f1268, %f1272;
	mul.rn.f32 	%f1274, %f1273, %f1268;
	mul.rn.f32 	%f1275, %f1274, %f1267;
	sub.f32 	%f1276, %f1263, %f1267;
	add.f32 	%f1277, %f1276, %f1276;
	neg.f32 	%f1278, %f1267;
	fma.rn.f32 	%f1279, %f1278, %f1263, %f1277;
	mul.rn.f32 	%f1280, %f1265, %f1279;
	add.f32 	%f1281, %f1275, %f1267;
	sub.f32 	%f1282, %f1267, %f1281;
	add.f32 	%f1283, %f1275, %f1282;
	add.f32 	%f1284, %f1280, %f1283;
	add.f32 	%f1285, %f1281, %f1284;
	sub.f32 	%f1286, %f1281, %f1285;
	add.f32 	%f1287, %f1284, %f1286;
	mov.f32 	%f1288, 0f3F317200;
	mul.rn.f32 	%f1289, %f1261, %f1288;
	mov.f32 	%f1290, 0f35BFBE8E;
	mul.rn.f32 	%f1291, %f1261, %f1290;
	add.f32 	%f1292, %f1289, %f1285;
	sub.f32 	%f1293, %f1289, %f1292;
	add.f32 	%f1294, %f1285, %f1293;
	add.f32 	%f1295, %f1287, %f1294;
	add.f32 	%f1296, %f1291, %f1295;
	add.f32 	%f1297, %f1292, %f1296;
	sub.f32 	%f1298, %f1292, %f1297;
	add.f32 	%f1299, %f1296, %f1298;
	mov.f32 	%f1300, 0f3EE8BA2E;
	mul.rn.f32 	%f1301, %f1300, %f1297;
	neg.f32 	%f1302, %f1301;
	fma.rn.f32 	%f1303, %f1300, %f1297, %f1302;
	fma.rn.f32 	%f1304, %f1300, %f1299, %f1303;
	mov.f32 	%f1305, 0f00000000;
	fma.rn.f32 	%f1306, %f1305, %f1297, %f1304;
	add.rn.f32 	%f1307, %f1301, %f1306;
	neg.f32 	%f1308, %f1307;
	add.rn.f32 	%f1309, %f1301, %f1308;
	add.rn.f32 	%f1310, %f1309, %f1306;
	mov.b32 	%r725, %f1307;
	setp.eq.s32 	%p163, %r725, 1118925336;
	add.s32 	%r726, %r725, -1;
	mov.b32 	%f1311, %r726;
	add.f32 	%f1312, %f1310, 0f37000000;
	selp.f32 	%f349, %f1312, %f1310, %p163;
	selp.f32 	%f1313, %f1311, %f1307, %p163;
	mov.f32 	%f1314, 0f3FB8AA3B;
	mul.rn.f32 	%f1315, %f1313, %f1314;
	cvt.rzi.f32.f32 	%f1316, %f1315;
	abs.f32 	%f1317, %f1316;
	setp.gt.f32 	%p164, %f1317, 0f42FC0000;
	mov.b32 	%r727, %f1316;
	and.b32  	%r728, %r727, -2147483648;
	or.b32  	%r729, %r728, 1123811328;
	mov.b32 	%f1318, %r729;
	selp.f32 	%f1319, %f1318, %f1316, %p164;
	mov.f32 	%f1320, 0fBF317218;
	fma.rn.f32 	%f1321, %f1319, %f1320, %f1313;
	mov.f32 	%f1322, 0f3102E308;
	fma.rn.f32 	%f1323, %f1319, %f1322, %f1321;
	mul.f32 	%f1324, %f1323, 0f3FB8AA3B;
	add.f32 	%f1325, %f1319, 0f4B40007F;
	mov.b32 	%r730, %f1325;
	shl.b32 	%r731, %r730, 23;
	mov.b32 	%f1326, %r731;
	ex2.approx.ftz.f32 	%f1327, %f1324;
	mul.f32 	%f350, %f1327, %f1326;
	setp.eq.f32 	%p165, %f350, 0f7F800000;
	mov.f32 	%f1444, 0f7F800000;
	@%p165 bra 	$L__BB0_161;

	fma.rn.f32 	%f1444, %f350, %f349, %f350;

$L__BB0_161:
	setp.lt.f32 	%p166, %f322, 0f00000000;
	and.pred  	%p4, %p166, %p137;
	setp.eq.f32 	%p168, %f322, 0f00000000;
	@%p168 bra 	$L__BB0_165;
	bra.uni 	$L__BB0_162;

$L__BB0_165:
	add.f32 	%f1332, %f322, %f322;
	selp.f32 	%f1446, %f1332, 0f00000000, %p137;
	bra.uni 	$L__BB0_166;

$L__BB0_162:
	mov.b32 	%r732, %f1444;
	xor.b32  	%r733, %r732, -2147483648;
	mov.b32 	%f1328, %r733;
	selp.f32 	%f1446, %f1328, %f1444, %p4;
	setp.geu.f32 	%p169, %f322, 0f00000000;
	@%p169 bra 	$L__BB0_166;

	mov.f32 	%f1329, 0f3EE8BA2E;
	cvt.rzi.f32.f32 	%f1330, %f1329;
	setp.eq.f32 	%p170, %f1330, 0f3EE8BA2E;
	@%p170 bra 	$L__BB0_166;

	mov.f32 	%f1446, 0f7FFFFFFF;

$L__BB0_166:
	add.f32 	%f1333, %f348, 0f3EE8BA2E;
	mov.b32 	%r734, %f1333;
	setp.lt.s32 	%p172, %r734, 2139095040;
	@%p172 bra 	$L__BB0_171;

	setp.gtu.f32 	%p173, %f348, 0f7F800000;
	@%p173 bra 	$L__BB0_170;
	bra.uni 	$L__BB0_168;

$L__BB0_170:
	add.f32 	%f1446, %f322, 0f3EE8BA2E;
	bra.uni 	$L__BB0_171;

$L__BB0_168:
	setp.neu.f32 	%p174, %f348, 0f7F800000;
	@%p174 bra 	$L__BB0_171;

	selp.f32 	%f1446, 0fFF800000, 0f7F800000, %p4;

$L__BB0_171:
	setp.eq.f32 	%p175, %f322, 0f3F800000;
	selp.f32 	%f1334, 0f3F800000, %f1446, %p175;
	cvt.sat.f32.f32 	%f1335, %f1334;
	ld.const.u64 	%rd157, [params+80];
	cvta.to.global.u64 	%rd158, %rd157;
	ld.const.u32 	%r735, [params+72];
	mad.lo.s32 	%r736, %r735, %r154, %r155;
	mul.f32 	%f1336, %f335, 0f437F0000;
	cvt.rzi.u32.f32 	%r737, %f1336;
	mul.f32 	%f1337, %f347, 0f437F0000;
	cvt.rzi.u32.f32 	%r738, %f1337;
	mul.f32 	%f1338, %f1335, 0f437F0000;
	cvt.rzi.u32.f32 	%r739, %f1338;
	mul.wide.u32 	%rd159, %r736, 4;
	add.s64 	%rd160, %rd158, %rd159;
	cvt.u16.u32 	%rs11, %r739;
	cvt.u16.u32 	%rs12, %r738;
	cvt.u16.u32 	%rs13, %r737;
	mov.u16 	%rs14, 255;
	st.global.v4.u8 	[%rd160], {%rs13, %rs12, %rs11, %rs14};
	ret;

}

